[
  {
    "gen": 1,
    "reward_mean": -102.38994204638064,
    "reward_max": -85.78293815424496,
    "reward_min": -107.7362176503591,
    "reward_std": 5.336278943221367,
    "timesteps": 46131,
    "learntime": 0.9301888151094317,
    "sampletime": 1.8076134519651532,
    "best_max_mean": -102.38994204638064,
    "best_max": -85.78293815424496
  },
  {
    "gen": 2,
    "reward_mean": -98.87746771859105,
    "reward_max": -75.0038542570264,
    "reward_min": -106.92669570522213,
    "reward_std": 8.38043333365588,
    "timesteps": 104445,
    "learntime": 0.5252543322276324,
    "sampletime": 2.1816633760463446,
    "best_max_mean": -98.87746771859105,
    "best_max": -75.0038542570264
  },
  {
    "gen": 3,
    "reward_mean": -99.60057819517064,
    "reward_max": -71.27210509140019,
    "reward_min": -106.92210351345551,
    "reward_std": 9.034415528427255,
    "timesteps": 159534,
    "learntime": 0.19659214606508613,
    "sampletime": 2.1487562528345734,
    "best_max_mean": -99.60057819517064,
    "best_max": -71.27210509140019
  },
  {
    "gen": 4,
    "reward_mean": -101.2176601159924,
    "reward_max": -65.16843225533904,
    "reward_min": -106.61777130632915,
    "reward_std": 7.486637971714725,
    "timesteps": 206073,
    "learntime": 0.15008568903431296,
    "sampletime": 1.5615969190839678,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 5,
    "reward_mean": -101.65495703856585,
    "reward_max": -75.96398201533663,
    "reward_min": -107.27555255541068,
    "reward_std": 6.530488234217195,
    "timesteps": 255372,
    "learntime": 0.20864144107326865,
    "sampletime": 2.083182480186224,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 6,
    "reward_mean": -98.9521998237791,
    "reward_max": -71.26730342517192,
    "reward_min": -107.7080989997326,
    "reward_std": 8.500026275739765,
    "timesteps": 308571,
    "learntime": 0.13564780913293362,
    "sampletime": 1.9999723308719695,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 7,
    "reward_mean": -99.58582380323205,
    "reward_max": -65.48651768971291,
    "reward_min": -106.89405201994425,
    "reward_std": 9.017732430561066,
    "timesteps": 364761,
    "learntime": 0.1920625080820173,
    "sampletime": 2.027694635093212,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 8,
    "reward_mean": -97.0277302524768,
    "reward_max": -64.06369167835113,
    "reward_min": -107.77877366666993,
    "reward_std": 9.456374919132495,
    "timesteps": 430275,
    "learntime": 0.16453531198203564,
    "sampletime": 2.841265350813046,
    "best_max_mean": -97.0277302524768,
    "best_max": -64.06369167835113
  },
  {
    "gen": 9,
    "reward_mean": -88.93528089997315,
    "reward_max": -48.41550483739454,
    "reward_min": -106.00306195074296,
    "reward_std": 16.15328314281969,
    "timesteps": 517482,
    "learntime": 0.19971034303307533,
    "sampletime": 3.3278583257924765,
    "best_max_mean": -88.93528089997315,
    "best_max": -48.41550483739454
  },
  {
    "gen": 10,
    "reward_mean": -97.7850168084176,
    "reward_max": -56.13470308608234,
    "reward_min": -106.9795834791254,
    "reward_std": 10.297551833955657,
    "timesteps": 573873,
    "learntime": 0.15607388713397086,
    "sampletime": 2.5424914290197194,
    "best_max_mean": -88.93528089997315,
    "best_max": -48.41550483739454
  },
  {
    "gen": 11,
    "reward_mean": -87.2773422771794,
    "reward_max": -57.79720460939589,
    "reward_min": -105.9365183078176,
    "reward_std": 14.769305267636927,
    "timesteps": 664392,
    "learntime": 0.1430875239893794,
    "sampletime": 3.6917873308993876,
    "best_max_mean": -88.93528089997315,
    "best_max": -48.41550483739454
  },
  {
    "gen": 12,
    "reward_mean": -80.42094375647807,
    "reward_max": -27.60276943081144,
    "reward_min": -105.6781937026447,
    "reward_std": 17.863412825985527,
    "timesteps": 781977,
    "learntime": 0.1866715729702264,
    "sampletime": 3.8761617289856076,
    "best_max_mean": -80.42094375647807,
    "best_max": -27.60276943081144
  },
  {
    "gen": 13,
    "reward_mean": -87.72489389132404,
    "reward_max": -35.7486622160597,
    "reward_min": -104.72366602052676,
    "reward_std": 13.737252647383496,
    "timesteps": 867792,
    "learntime": 0.15704470197670162,
    "sampletime": 2.8634610809385777,
    "best_max_mean": -80.42094375647807,
    "best_max": -27.60276943081144
  },
  {
    "gen": 14,
    "reward_mean": -73.09934387798369,
    "reward_max": -27.192279244222764,
    "reward_min": -105.81903668852861,
    "reward_std": 20.82300250068368,
    "timesteps": 996285,
    "learntime": 0.14462578506208956,
    "sampletime": 4.8049883369822055,
    "best_max_mean": -73.09934387798369,
    "best_max": -27.192279244222764
  },
  {
    "gen": 15,
    "reward_mean": -70.19649255630549,
    "reward_max": 2.038026873036428,
    "reward_min": -104.54970959123847,
    "reward_std": 19.696779954194778,
    "timesteps": 1135209,
    "learntime": 0.1440380709245801,
    "sampletime": 4.2982004140503705,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 16,
    "reward_mean": -66.28953162540066,
    "reward_max": -25.654304838221936,
    "reward_min": -105.06073446698825,
    "reward_std": 20.763560450475904,
    "timesteps": 1287507,
    "learntime": 0.20291910297237337,
    "sampletime": 5.134511719923466,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 17,
    "reward_mean": -56.46292248290599,
    "reward_max": -26.285616007435955,
    "reward_min": -103.94754674692045,
    "reward_std": 17.527737724338785,
    "timesteps": 1469853,
    "learntime": 0.1402878570370376,
    "sampletime": 5.780031006084755,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 18,
    "reward_mean": -56.65340986580772,
    "reward_max": -18.630662049166858,
    "reward_min": -103.84975305801454,
    "reward_std": 17.12917695506961,
    "timesteps": 1652412,
    "learntime": 0.2113352408632636,
    "sampletime": 5.026630163891241,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 19,
    "reward_mean": -64.27318182043786,
    "reward_max": -27.532143769630547,
    "reward_min": -104.19052099531065,
    "reward_std": 19.30834453749585,
    "timesteps": 1813989,
    "learntime": 0.18765565403737128,
    "sampletime": 4.916664909105748,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 20,
    "reward_mean": -53.88590894887239,
    "reward_max": -9.949309100312266,
    "reward_min": -93.97195758591548,
    "reward_std": 18.801988237921837,
    "timesteps": 2004750,
    "learntime": 0.1927175698801875,
    "sampletime": 6.123979874886572,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 21,
    "reward_mean": -54.67908825287088,
    "reward_max": -27.73553565392892,
    "reward_min": -94.60309190953603,
    "reward_std": 15.1277704887685,
    "timesteps": 2192406,
    "learntime": 0.14334710291586816,
    "sampletime": 5.89732049102895,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 22,
    "reward_mean": -56.214122348593875,
    "reward_max": -10.258356088828863,
    "reward_min": -95.07827982012972,
    "reward_std": 16.883999753068835,
    "timesteps": 2376036,
    "learntime": 0.1783564940560609,
    "sampletime": 5.853789209155366,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 23,
    "reward_mean": -49.97193416491082,
    "reward_max": -7.984028022736311,
    "reward_min": -104.40096804536316,
    "reward_std": 19.567580376681533,
    "timesteps": 2578344,
    "learntime": 0.14212964591570199,
    "sampletime": 5.59993737610057,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 24,
    "reward_mean": -45.973636347988695,
    "reward_max": 0.8685248612309789,
    "reward_min": -85.73624557396397,
    "reward_std": 19.198646745120275,
    "timesteps": 2794860,
    "learntime": 0.18819585791788995,
    "sampletime": 6.4080397970974445,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 25,
    "reward_mean": -39.502262391974895,
    "reward_max": -8.971229608706906,
    "reward_min": -76.17843568526828,
    "reward_std": 14.273361391918257,
    "timesteps": 3029601,
    "learntime": 0.14761647814884782,
    "sampletime": 6.416189474053681,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 26,
    "reward_mean": -35.38652359541666,
    "reward_max": 0.5135713027028174,
    "reward_min": -78.52739012406933,
    "reward_std": 17.687544327027673,
    "timesteps": 3278337,
    "learntime": 0.1991992611438036,
    "sampletime": 6.683653454994783,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 27,
    "reward_mean": -44.449549833335716,
    "reward_max": -17.82874547238603,
    "reward_min": -76.04549739938794,
    "reward_std": 14.421309428354922,
    "timesteps": 3500604,
    "learntime": 0.20435898192226887,
    "sampletime": 6.7573989981319755,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 28,
    "reward_mean": -47.40337869372617,
    "reward_max": -8.213795739395374,
    "reward_min": -84.98092117191602,
    "reward_std": 19.261669578666485,
    "timesteps": 3710733,
    "learntime": 0.14020783896557987,
    "sampletime": 6.327763136010617,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 29,
    "reward_mean": -52.374007311149555,
    "reward_max": -8.547987124315556,
    "reward_min": -94.73693626404346,
    "reward_std": 19.542515636150597,
    "timesteps": 3905619,
    "learntime": 0.1869995379820466,
    "sampletime": 5.707879065070301,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 30,
    "reward_mean": -47.844439884452626,
    "reward_max": -17.99338314646968,
    "reward_min": -84.93164482170886,
    "reward_std": 17.108700055893063,
    "timesteps": 4116171,
    "learntime": 0.14239670103415847,
    "sampletime": 6.3388183899223804,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 31,
    "reward_mean": -39.17696359531341,
    "reward_max": -7.5873968389609665,
    "reward_min": -104.33252508345653,
    "reward_std": 19.74578112019199,
    "timesteps": 4352808,
    "learntime": 0.1941578120458871,
    "sampletime": 6.673551396932453,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 32,
    "reward_mean": -40.41490456587953,
    "reward_max": 0.6760913394953734,
    "reward_min": -83.8787130974233,
    "reward_std": 19.05939557977212,
    "timesteps": 4584423,
    "learntime": 0.13952444889582694,
    "sampletime": 6.481925494037569,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 33,
    "reward_mean": -33.52666722504095,
    "reward_max": -0.14811956309454946,
    "reward_min": -65.86744315419911,
    "reward_std": 15.99516201653817,
    "timesteps": 4838892,
    "learntime": 0.1785840999800712,
    "sampletime": 6.785311562009156,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 34,
    "reward_mean": -37.0108426661061,
    "reward_max": 0.3414849525098816,
    "reward_min": -75.99715627461786,
    "reward_std": 18.140635641991107,
    "timesteps": 5082918,
    "learntime": 0.1425949081312865,
    "sampletime": 6.78934766119346,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 35,
    "reward_mean": -31.673934213079093,
    "reward_max": 0.29029221236917063,
    "reward_min": -101.35318438858359,
    "reward_std": 18.25740566354652,
    "timesteps": 5342892,
    "learntime": 0.18362047895789146,
    "sampletime": 6.8787407469935715,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 36,
    "reward_mean": -20.596387028474382,
    "reward_max": 1.4338661646549762,
    "reward_min": -51.81269219430221,
    "reward_std": 13.067138984481996,
    "timesteps": 5638923,
    "learntime": 0.14207813888788223,
    "sampletime": 7.849837624002248,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 37,
    "reward_mean": -29.4752695795391,
    "reward_max": 1.1517201887415423,
    "reward_min": -76.38338478639099,
    "reward_std": 18.64440255799288,
    "timesteps": 5904915,
    "learntime": 0.19296734407544136,
    "sampletime": 7.217592814005911,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 38,
    "reward_mean": -25.287716592062573,
    "reward_max": 1.2231071980667423,
    "reward_min": -65.99550244607256,
    "reward_std": 16.044298556242726,
    "timesteps": 6190716,
    "learntime": 0.13522583316080272,
    "sampletime": 7.639511673012748,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 39,
    "reward_mean": -11.596995678121061,
    "reward_max": 1.4222444697645376,
    "reward_min": -57.78689074206914,
    "reward_std": 10.974404566484257,
    "timesteps": 6516369,
    "learntime": 0.17648016707971692,
    "sampletime": 8.22616353398189,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 40,
    "reward_mean": -20.72170670758458,
    "reward_max": 0.8905043049440272,
    "reward_min": -75.39002646708326,
    "reward_std": 14.516262079433536,
    "timesteps": 6814203,
    "learntime": 0.14806496491655707,
    "sampletime": 7.551652794936672,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 41,
    "reward_mean": -10.651242528363127,
    "reward_max": 2.0419432839419924,
    "reward_min": -49.725032747283365,
    "reward_std": 11.753708216688016,
    "timesteps": 7145211,
    "learntime": 0.17301373998634517,
    "sampletime": 8.388878050027415,
    "best_max_mean": -10.651242528363127,
    "best_max": 2.0419432839419924
  },
  {
    "gen": 42,
    "reward_mean": -4.181951147291855,
    "reward_max": 2.2129296977331627,
    "reward_min": -27.09957153613725,
    "reward_std": 6.997478891260294,
    "timesteps": 7492026,
    "learntime": 0.15448490506969392,
    "sampletime": 8.433554123854265,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 43,
    "reward_mean": -3.8453899021074465,
    "reward_max": 2.0899661730307098,
    "reward_min": -26.780295251163114,
    "reward_std": 6.60951742207531,
    "timesteps": 7839249,
    "learntime": 0.2085859440267086,
    "sampletime": 8.501716885017231,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 44,
    "reward_mean": -2.95656072162115,
    "reward_max": 2.127227258764445,
    "reward_min": -47.55577632858927,
    "reward_std": 8.05084569620544,
    "timesteps": 8189109,
    "learntime": 0.147897575981915,
    "sampletime": 8.617220497922972,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 45,
    "reward_mean": -1.1586074313807209,
    "reward_max": 2.0507708590610254,
    "reward_min": -17.769815113776446,
    "reward_std": 4.396912618060163,
    "timesteps": 8543046,
    "learntime": 0.1874341059010476,
    "sampletime": 8.593867426970974,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 46,
    "reward_mean": 0.8758083467020369,
    "reward_max": 2.0418922907362367,
    "reward_min": -17.2220408182563,
    "reward_std": 2.5729674644354414,
    "timesteps": 8902713,
    "learntime": 0.14543829881586134,
    "sampletime": 8.725934099871665,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 47,
    "reward_mean": -2.165411959787625,
    "reward_max": 2.2421953672036925,
    "reward_min": -34.71552958687729,
    "reward_std": 6.939037190707742,
    "timesteps": 9254568,
    "learntime": 0.20420188712887466,
    "sampletime": 8.670477295992896,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 48,
    "reward_mean": 1.474219021535204,
    "reward_max": 2.1087811529933873,
    "reward_min": 0.03495460979885825,
    "reward_std": 0.30848162974336935,
    "timesteps": 9615288,
    "learntime": 0.14052801998332143,
    "sampletime": 8.849837864981964,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 49,
    "reward_mean": 1.1228624132698484,
    "reward_max": 2.065879017859007,
    "reward_min": -8.419802303835628,
    "reward_std": 1.997494343207942,
    "timesteps": 9974748,
    "learntime": 0.19931248808279634,
    "sampletime": 8.721105858916417,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 50,
    "reward_mean": -0.4769958233704735,
    "reward_max": 1.9337291791012026,
    "reward_min": -22.70244519318739,
    "reward_std": 4.728403407859763,
    "timesteps": 10331505,
    "learntime": 0.15311009204015136,
    "sampletime": 8.66865298198536,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 51,
    "reward_mean": 1.235418092813611,
    "reward_max": 2.2578653277843377,
    "reward_min": -9.383352967367198,
    "reward_std": 2.139425968504328,
    "timesteps": 10690977,
    "learntime": 0.19140025088563561,
    "sampletime": 8.817613120889291,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 52,
    "reward_mean": 1.06584610330267,
    "reward_max": 2.20397818291729,
    "reward_min": -7.747818761258248,
    "reward_std": 1.928172385264683,
    "timesteps": 11051067,
    "learntime": 0.14751977589912713,
    "sampletime": 8.797781035071239,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 53,
    "reward_mean": 0.9758177601469334,
    "reward_max": 2.205417457982106,
    "reward_min": -7.497108487066617,
    "reward_std": 2.6355445262342925,
    "timesteps": 11409255,
    "learntime": 0.21060635289177299,
    "sampletime": 8.821140242973343,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 54,
    "reward_mean": 0.9977810815060011,
    "reward_max": 2.140227806091195,
    "reward_min": -16.233687034666108,
    "reward_std": 3.356812948335024,
    "timesteps": 11767578,
    "learntime": 0.16157127521000803,
    "sampletime": 8.699655055999756,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 55,
    "reward_mean": 1.6057211638531097,
    "reward_max": 2.4207475148864543,
    "reward_min": -3.7977498569067207,
    "reward_std": 0.8803230362857044,
    "timesteps": 12128298,
    "learntime": 0.19143312913365662,
    "sampletime": 8.779784717829898,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 56,
    "reward_mean": 1.3496704086576812,
    "reward_max": 2.2051075713349166,
    "reward_min": -7.090324603982566,
    "reward_std": 1.8662554718612063,
    "timesteps": 12487875,
    "learntime": 0.1549840560182929,
    "sampletime": 8.65475765708834,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 57,
    "reward_mean": 1.8394492048340176,
    "reward_max": 2.283127114550687,
    "reward_min": 1.5234195190220774,
    "reward_std": 0.15553942276844981,
    "timesteps": 12848595,
    "learntime": 0.20076390309259295,
    "sampletime": 8.660165335051715,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 58,
    "reward_mean": 1.064805427801108,
    "reward_max": 2.252194483041282,
    "reward_min": -13.942375453885896,
    "reward_std": 2.863474234895718,
    "timesteps": 13206867,
    "learntime": 0.1470360830426216,
    "sampletime": 8.675073044141755,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 59,
    "reward_mean": 1.8398472224200517,
    "reward_max": 2.081085004746757,
    "reward_min": 1.5025827772421452,
    "reward_std": 0.126632512833579,
    "timesteps": 13567587,
    "learntime": 0.15439267782494426,
    "sampletime": 8.776057261042297,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 60,
    "reward_mean": 1.8379090197514878,
    "reward_max": 2.083551095486844,
    "reward_min": 1.539532783355549,
    "reward_std": 0.1295365428720181,
    "timesteps": 13928307,
    "learntime": 0.19695777911692858,
    "sampletime": 8.729106212966144,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 61,
    "reward_mean": 1.8196659655521907,
    "reward_max": 2.114109133888355,
    "reward_min": 1.5542171989765097,
    "reward_std": 0.1267809965767768,
    "timesteps": 14289027,
    "learntime": 0.18955138116143644,
    "sampletime": 8.735499982023612,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 62,
    "reward_mean": 1.373646314579484,
    "reward_max": 2.100014968201952,
    "reward_min": -7.289584486533636,
    "reward_std": 1.8464151240742732,
    "timesteps": 14648697,
    "learntime": 0.15478093991987407,
    "sampletime": 8.781049276003614,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 63,
    "reward_mean": 1.833711796656752,
    "reward_max": 2.1358767444387774,
    "reward_min": 1.4592537950520625,
    "reward_std": 0.15214980310383008,
    "timesteps": 15009417,
    "learntime": 0.19096525781787932,
    "sampletime": 8.800790159963071,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 64,
    "reward_mean": 1.4101507352344262,
    "reward_max": 2.1684154354134604,
    "reward_min": -15.54409994794917,
    "reward_std": 2.3912561896743174,
    "timesteps": 15368985,
    "learntime": 0.14365899399854243,
    "sampletime": 8.749338015913963,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 65,
    "reward_mean": 1.340498472521806,
    "reward_max": 2.0701214816261864,
    "reward_min": -7.711417927551367,
    "reward_std": 1.984719518272824,
    "timesteps": 15728628,
    "learntime": 0.20354533707723022,
    "sampletime": 8.70200043800287,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 66,
    "reward_mean": 1.8672699945939542,
    "reward_max": 2.2606180890607974,
    "reward_min": 1.6340927164005572,
    "reward_std": 0.11186410262587987,
    "timesteps": 16089348,
    "learntime": 0.14500724710524082,
    "sampletime": 8.940386548172683,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 67,
    "reward_mean": -1.1299414572408004,
    "reward_max": 2.2208359594153437,
    "reward_min": -61.78228093980754,
    "reward_std": 8.483548023937297,
    "timesteps": 16441077,
    "learntime": 0.20683235302567482,
    "sampletime": 8.540620350046083,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 68,
    "reward_mean": 1.7361502219121918,
    "reward_max": 2.1349470761417617,
    "reward_min": 1.1805517271312747,
    "reward_std": 0.18207160445440204,
    "timesteps": 16801797,
    "learntime": 0.15544532286003232,
    "sampletime": 8.70559643697925,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 69,
    "reward_mean": 1.7743528771293597,
    "reward_max": 2.073502242852664,
    "reward_min": 1.4803373964589817,
    "reward_std": 0.13882392350899248,
    "timesteps": 17162517,
    "learntime": 0.1870911791920662,
    "sampletime": 8.87973100389354,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 70,
    "reward_mean": 1.8131955782343556,
    "reward_max": 2.178854902402637,
    "reward_min": 1.395625891021951,
    "reward_std": 0.1448243656611982,
    "timesteps": 17523237,
    "learntime": 0.1517078848555684,
    "sampletime": 8.900635349098593,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 71,
    "reward_mean": 1.8028914600126653,
    "reward_max": 2.1804728198829126,
    "reward_min": 1.4966462738247506,
    "reward_std": 0.1527649646819695,
    "timesteps": 17883957,
    "learntime": 0.20059757796116173,
    "sampletime": 8.805786815937608,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 72,
    "reward_mean": 1.7798444314080772,
    "reward_max": 2.2209375139562195,
    "reward_min": 1.2804822554444923,
    "reward_std": 0.16140593879752588,
    "timesteps": 18244677,
    "learntime": 0.15663485904224217,
    "sampletime": 8.684157761977986,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 73,
    "reward_mean": 1.8131424829518221,
    "reward_max": 2.169663594505186,
    "reward_min": 1.4153380829798548,
    "reward_std": 0.16359699247361562,
    "timesteps": 18605397,
    "learntime": 0.1821676050312817,
    "sampletime": 8.770299046998844,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 74,
    "reward_mean": 1.7721635360733752,
    "reward_max": 2.22744338652895,
    "reward_min": 1.3434381998129956,
    "reward_std": 0.15202170306135523,
    "timesteps": 18966117,
    "learntime": 0.1466178889386356,
    "sampletime": 8.785338483052328,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 75,
    "reward_mean": 1.7833131057144005,
    "reward_max": 2.129017093834229,
    "reward_min": 1.4916072738018207,
    "reward_std": 0.1447651098977334,
    "timesteps": 19326837,
    "learntime": 0.2050601018127054,
    "sampletime": 8.777372219832614,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 76,
    "reward_mean": 1.8468159781136944,
    "reward_max": 2.2148500320116793,
    "reward_min": 1.5205648770083096,
    "reward_std": 0.1452164582558042,
    "timesteps": 19687557,
    "learntime": 0.14939052797853947,
    "sampletime": 8.789025787031278,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 77,
    "reward_mean": 1.875189914659899,
    "reward_max": 2.173421370014287,
    "reward_min": 1.5920841820382812,
    "reward_std": 0.13778882876281448,
    "timesteps": 20048277,
    "learntime": 0.18729963805526495,
    "sampletime": 8.759258867939934,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 78,
    "reward_mean": 1.858387611583331,
    "reward_max": 2.243866981488984,
    "reward_min": 1.544122258987924,
    "reward_std": 0.1430213160280324,
    "timesteps": 20408997,
    "learntime": 0.1374845369718969,
    "sampletime": 8.701202847063541,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 79,
    "reward_mean": 1.8084033523809782,
    "reward_max": 2.182752132122967,
    "reward_min": 1.439010003366449,
    "reward_std": 0.136820660385389,
    "timesteps": 20769717,
    "learntime": 0.1894079379271716,
    "sampletime": 8.805576673941687,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 80,
    "reward_mean": 1.8001204213655462,
    "reward_max": 2.133700546013915,
    "reward_min": 1.544654642522798,
    "reward_std": 0.13405386638830866,
    "timesteps": 21130437,
    "learntime": 0.1481238310225308,
    "sampletime": 8.815022290917113,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 81,
    "reward_mean": 1.7228461246781726,
    "reward_max": 2.018473058539622,
    "reward_min": 1.3979099988796226,
    "reward_std": 0.14148584713815315,
    "timesteps": 21491157,
    "learntime": 0.19784932397305965,
    "sampletime": 8.635327907977626,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 82,
    "reward_mean": 1.8058298452057588,
    "reward_max": 2.2431676187967002,
    "reward_min": 1.3525008876499147,
    "reward_std": 0.18146990432110008,
    "timesteps": 21851877,
    "learntime": 0.14780797879211605,
    "sampletime": 8.688095310004428,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 83,
    "reward_mean": 1.3624802576035977,
    "reward_max": 2.109834511918859,
    "reward_min": -7.769504370428906,
    "reward_std": 1.918145262459881,
    "timesteps": 22211367,
    "learntime": 0.19156411290168762,
    "sampletime": 8.646695016184822,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 84,
    "reward_mean": 1.7890955357205502,
    "reward_max": 2.171789818006357,
    "reward_min": 1.2798715458696004,
    "reward_std": 0.15481800086739755,
    "timesteps": 22572087,
    "learntime": 0.1534149320796132,
    "sampletime": 8.940437240060419,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 85,
    "reward_mean": 1.8134314654963024,
    "reward_max": 2.1162871697536776,
    "reward_min": 1.489877415190371,
    "reward_std": 0.1350532049259689,
    "timesteps": 22932807,
    "learntime": 0.21159828105010092,
    "sampletime": 8.75964510301128,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 86,
    "reward_mean": 1.8675373582481507,
    "reward_max": 2.258833254038383,
    "reward_min": 1.4745876679727268,
    "reward_std": 0.1678663225129436,
    "timesteps": 23293527,
    "learntime": 0.14753201301209629,
    "sampletime": 8.674761308124289,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 87,
    "reward_mean": 1.7389489847954094,
    "reward_max": 2.146414571921479,
    "reward_min": 1.4106479467309045,
    "reward_std": 0.15343912034526466,
    "timesteps": 23654247,
    "learntime": 0.19404073688201606,
    "sampletime": 8.743133696028963,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 88,
    "reward_mean": 1.4175039568593473,
    "reward_max": 2.3283660152898817,
    "reward_min": -7.296586049889976,
    "reward_std": 1.902376416847704,
    "timesteps": 24013821,
    "learntime": 0.13465973711572587,
    "sampletime": 8.860540149034932,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 89,
    "reward_mean": 1.798943645347069,
    "reward_max": 2.3486523548474163,
    "reward_min": 1.446018485987388,
    "reward_std": 0.14514749022339635,
    "timesteps": 24374541,
    "learntime": 0.18506359704770148,
    "sampletime": 8.725029754918069,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 90,
    "reward_mean": 1.8339495438901423,
    "reward_max": 2.4054319046201376,
    "reward_min": 1.465655304421845,
    "reward_std": 0.1940664020672639,
    "timesteps": 24735261,
    "learntime": 0.14117823308333755,
    "sampletime": 8.69743425399065,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 91,
    "reward_mean": 1.8387236121078456,
    "reward_max": 2.1885382484320077,
    "reward_min": 1.55346398978468,
    "reward_std": 0.14235106644414702,
    "timesteps": 25095981,
    "learntime": 0.2056937050074339,
    "sampletime": 8.875247024931014,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 92,
    "reward_mean": 1.8665838478869494,
    "reward_max": 2.245465357407792,
    "reward_min": 1.4527137431238444,
    "reward_std": 0.15815032081736524,
    "timesteps": 25456701,
    "learntime": 0.14270089101046324,
    "sampletime": 8.78485303511843,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 93,
    "reward_mean": 1.8438424855624782,
    "reward_max": 2.4353959641779146,
    "reward_min": 1.536308085814885,
    "reward_std": 0.1699529930956924,
    "timesteps": 25817421,
    "learntime": 0.19038865086622536,
    "sampletime": 8.677330201957375,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 94,
    "reward_mean": 1.8292762950906805,
    "reward_max": 2.1821598251101944,
    "reward_min": 1.5680882043035844,
    "reward_std": 0.16088479185926388,
    "timesteps": 26178141,
    "learntime": 0.1582363231573254,
    "sampletime": 8.8551590309944,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 95,
    "reward_mean": 1.8605830274404083,
    "reward_max": 2.1532385282334854,
    "reward_min": 1.5206885039870999,
    "reward_std": 0.15175691072009528,
    "timesteps": 26538861,
    "learntime": 0.1924603630322963,
    "sampletime": 8.736042844131589,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 96,
    "reward_mean": 1.3577479990887065,
    "reward_max": 2.076310939946612,
    "reward_min": -7.318889287591009,
    "reward_std": 1.8859397950611951,
    "timesteps": 26898420,
    "learntime": 0.14986629108898342,
    "sampletime": 8.857441214844584,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 97,
    "reward_mean": 1.8201028433018165,
    "reward_max": 2.131878993936078,
    "reward_min": 1.5026805244393218,
    "reward_std": 0.13349971976073355,
    "timesteps": 27259140,
    "learntime": 0.1985628551337868,
    "sampletime": 8.755630096886307,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 98,
    "reward_mean": 1.8549824600003717,
    "reward_max": 2.136833842939018,
    "reward_min": 1.5350975805336142,
    "reward_std": 0.13277104762907085,
    "timesteps": 27619860,
    "learntime": 0.1490746270865202,
    "sampletime": 8.83984268293716,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 99,
    "reward_mean": 1.8135750688300383,
    "reward_max": 2.1920612261270747,
    "reward_min": 1.387476075348921,
    "reward_std": 0.15192984733908238,
    "timesteps": 27980580,
    "learntime": 0.1996634230017662,
    "sampletime": 8.71119588194415,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 100,
    "reward_mean": 1.4044047532073505,
    "reward_max": 2.226917915287862,
    "reward_min": -6.838007699754655,
    "reward_std": 1.8205225706750456,
    "timesteps": 28340232,
    "learntime": 0.2029922059737146,
    "sampletime": 8.819083415204659,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 101,
    "reward_mean": 1.3598318627057286,
    "reward_max": 2.1721114438259956,
    "reward_min": -7.169738280922034,
    "reward_std": 1.7853568664028416,
    "timesteps": 28699707,
    "learntime": 0.15066894190385938,
    "sampletime": 8.825601983815432,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 102,
    "reward_mean": 1.8199854286871333,
    "reward_max": 2.0817132094381305,
    "reward_min": 1.5533917929543242,
    "reward_std": 0.13446122234312757,
    "timesteps": 29060427,
    "learntime": 0.15357863693498075,
    "sampletime": 8.846246052067727,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 103,
    "reward_mean": 1.8055615684179755,
    "reward_max": 2.124750659284301,
    "reward_min": 1.3458421353575274,
    "reward_std": 0.1651659445448548,
    "timesteps": 29421147,
    "learntime": 0.2038137731142342,
    "sampletime": 8.705014519160613,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 104,
    "reward_mean": 1.7910449023467274,
    "reward_max": 2.0258040348408275,
    "reward_min": 1.3622720861916802,
    "reward_std": 0.13859643003273672,
    "timesteps": 29781867,
    "learntime": 0.14839624497108161,
    "sampletime": 8.748305465094745,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 105,
    "reward_mean": 1.800558428484063,
    "reward_max": 2.2136412065337905,
    "reward_min": 1.4448020156689563,
    "reward_std": 0.14925180567402585,
    "timesteps": 30142587,
    "learntime": 0.2079443719703704,
    "sampletime": 8.839402351062745,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 106,
    "reward_mean": 1.7902239106963127,
    "reward_max": 2.089369299380585,
    "reward_min": 1.183703992828887,
    "reward_std": 0.1586830711722602,
    "timesteps": 30503307,
    "learntime": 0.14937153598293662,
    "sampletime": 8.821265157079324,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 107,
    "reward_mean": 1.8295275469751062,
    "reward_max": 2.2703465727068792,
    "reward_min": 1.4687864040930014,
    "reward_std": 0.1460255071046036,
    "timesteps": 30864027,
    "learntime": 0.18851455906406045,
    "sampletime": 8.704435253050178,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 108,
    "reward_mean": 1.8425188061994344,
    "reward_max": 2.1560485464352563,
    "reward_min": 1.441508987227056,
    "reward_std": 0.14126496038746736,
    "timesteps": 31224747,
    "learntime": 0.15591965685598552,
    "sampletime": 8.795919596916065,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 109,
    "reward_mean": 1.805019450860995,
    "reward_max": 2.118811530823057,
    "reward_min": 1.3966747252729155,
    "reward_std": 0.14767219667525436,
    "timesteps": 31585467,
    "learntime": 0.18887286190874875,
    "sampletime": 8.728283689823002,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 110,
    "reward_mean": 1.439344981347884,
    "reward_max": 2.2425230345062555,
    "reward_min": -7.218818652190476,
    "reward_std": 1.9155310110256285,
    "timesteps": 31945092,
    "learntime": 0.15288463700562716,
    "sampletime": 8.740765566006303,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 111,
    "reward_mean": 1.8465280063268383,
    "reward_max": 2.2088321682743026,
    "reward_min": 1.627031128186814,
    "reward_std": 0.13305904823492193,
    "timesteps": 32305812,
    "learntime": 0.19736192794516683,
    "sampletime": 8.731206133030355,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 112,
    "reward_mean": 1.8007712616722449,
    "reward_max": 2.131308844649921,
    "reward_min": 1.555153424796915,
    "reward_std": 0.12781357125086548,
    "timesteps": 32666532,
    "learntime": 0.15528755099512637,
    "sampletime": 8.728113572811708,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 113,
    "reward_mean": 1.8217953599032626,
    "reward_max": 2.1347633017170584,
    "reward_min": 1.3304064361833605,
    "reward_std": 0.16004004781244097,
    "timesteps": 33027252,
    "learntime": 0.2032155441120267,
    "sampletime": 8.953973370138556,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 114,
    "reward_mean": 1.4191529474335567,
    "reward_max": 2.1245686415285365,
    "reward_min": -7.080276738248252,
    "reward_std": 1.8652160750183377,
    "timesteps": 33386781,
    "learntime": 0.15486202319152653,
    "sampletime": 8.653039505006745,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 115,
    "reward_mean": 1.880896420046251,
    "reward_max": 2.2150219442233303,
    "reward_min": 1.431862945037814,
    "reward_std": 0.1492262081369713,
    "timesteps": 33747501,
    "learntime": 0.20241633406840265,
    "sampletime": 8.805198047775775,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 116,
    "reward_mean": 1.8164206625797064,
    "reward_max": 2.1748652970868076,
    "reward_min": 1.4140033409921933,
    "reward_std": 0.13546062390331495,
    "timesteps": 34108221,
    "learntime": 0.1514697619713843,
    "sampletime": 8.741126043954864,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 117,
    "reward_mean": 1.0055376375594922,
    "reward_max": 2.1854415414290416,
    "reward_min": -7.076859031777395,
    "reward_std": 2.464273481531437,
    "timesteps": 34467102,
    "learntime": 0.1872148308902979,
    "sampletime": 8.723808594048023,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 118,
    "reward_mean": 1.7717260978351637,
    "reward_max": 2.1777671850709734,
    "reward_min": 1.461604803073866,
    "reward_std": 0.1464708610418815,
    "timesteps": 34827822,
    "learntime": 0.1571102871093899,
    "sampletime": 8.584708114853129,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 119,
    "reward_mean": 1.775906827161965,
    "reward_max": 2.200581100966892,
    "reward_min": 1.5301259081117493,
    "reward_std": 0.15170622928184613,
    "timesteps": 35188542,
    "learntime": 0.19376639812253416,
    "sampletime": 8.67426804988645,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 120,
    "reward_mean": 1.8216991321540297,
    "reward_max": 2.3387817081300315,
    "reward_min": 1.5197425273686846,
    "reward_std": 0.17026673085273114,
    "timesteps": 35549262,
    "learntime": 0.159284139983356,
    "sampletime": 8.754971381044015,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 121,
    "reward_mean": 1.7389701524698882,
    "reward_max": 2.0300018433005156,
    "reward_min": 1.4098240253652963,
    "reward_std": 0.14078044756113678,
    "timesteps": 35909982,
    "learntime": 0.2164786879438907,
    "sampletime": 8.621894634095952,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 122,
    "reward_mean": 1.8385915053882966,
    "reward_max": 2.285837875607254,
    "reward_min": 1.531838098198121,
    "reward_std": 0.16964652790739046,
    "timesteps": 36270702,
    "learntime": 0.14413718087598681,
    "sampletime": 8.521492966916412,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 123,
    "reward_mean": 1.373490063151034,
    "reward_max": 2.1917737298997824,
    "reward_min": -7.358886542948756,
    "reward_std": 1.9323476965364854,
    "timesteps": 36630216,
    "learntime": 0.21160610811784863,
    "sampletime": 8.660042988834903,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 124,
    "reward_mean": 1.8229135401269443,
    "reward_max": 2.2535321145269025,
    "reward_min": 1.3464659056061794,
    "reward_std": 0.16973182749624838,
    "timesteps": 36990936,
    "learntime": 0.1528198211453855,
    "sampletime": 8.683992609847337,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 125,
    "reward_mean": 1.849392754796286,
    "reward_max": 2.335297485402954,
    "reward_min": 1.5168953725515142,
    "reward_std": 0.15140861241400058,
    "timesteps": 37351656,
    "learntime": 0.18858265317976475,
    "sampletime": 8.756440917029977,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 126,
    "reward_mean": 1.4361281384142193,
    "reward_max": 2.1859497866698225,
    "reward_min": -6.750691706809451,
    "reward_std": 1.7692782915716685,
    "timesteps": 37711152,
    "learntime": 0.1542447058018297,
    "sampletime": 8.803968272870407,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 127,
    "reward_mean": 1.8471961142723474,
    "reward_max": 2.1622984294354493,
    "reward_min": 1.4889736503263855,
    "reward_std": 0.12891509758219263,
    "timesteps": 38071872,
    "learntime": 0.1822589358780533,
    "sampletime": 8.785256410948932,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 128,
    "reward_mean": 1.8447179916833552,
    "reward_max": 2.2063662793952985,
    "reward_min": 1.4751117881987168,
    "reward_std": 0.15259274369240017,
    "timesteps": 38432592,
    "learntime": 0.15218728291802108,
    "sampletime": 8.7538019658532,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 129,
    "reward_mean": 1.7922027347952976,
    "reward_max": 2.0811891052025264,
    "reward_min": 1.5476991579282275,
    "reward_std": 0.13269520448177194,
    "timesteps": 38793312,
    "learntime": 0.19094848912209272,
    "sampletime": 8.575346086872742,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 130,
    "reward_mean": 1.7931518693347512,
    "reward_max": 2.244028211370193,
    "reward_min": 1.4736206729836367,
    "reward_std": 0.1449438352927126,
    "timesteps": 39154032,
    "learntime": 0.1579722489695996,
    "sampletime": 8.834494502982125,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 131,
    "reward_mean": 1.7707630439451578,
    "reward_max": 2.1303212661910527,
    "reward_min": 1.4038748783415105,
    "reward_std": 0.1444169755878066,
    "timesteps": 39514752,
    "learntime": 0.20818188996054232,
    "sampletime": 8.716788929887116,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 132,
    "reward_mean": 1.7862054473340097,
    "reward_max": 2.0794328896921437,
    "reward_min": 1.4718385117647053,
    "reward_std": 0.1433942118020762,
    "timesteps": 39875472,
    "learntime": 0.15005011903122067,
    "sampletime": 8.837261148961261,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 133,
    "reward_mean": 1.396112765336524,
    "reward_max": 2.1078555574993385,
    "reward_min": -7.225593523690341,
    "reward_std": 1.8608446715509206,
    "timesteps": 40235154,
    "learntime": 0.1852319419849664,
    "sampletime": 8.701386308064684,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 134,
    "reward_mean": 1.8419248241991086,
    "reward_max": 2.0382854638155536,
    "reward_min": 1.61050197012567,
    "reward_std": 0.12268399515533061,
    "timesteps": 40595874,
    "learntime": 0.15520854899659753,
    "sampletime": 8.71826554602012,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 135,
    "reward_mean": 1.775701977954959,
    "reward_max": 2.1045957732195437,
    "reward_min": 1.3033063511918008,
    "reward_std": 0.14149689885237235,
    "timesteps": 40956594,
    "learntime": 0.20796158793382347,
    "sampletime": 8.861378510016948,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 136,
    "reward_mean": 1.8048925785729417,
    "reward_max": 2.0657866028050176,
    "reward_min": 1.1496230139869785,
    "reward_std": 0.15766350867180495,
    "timesteps": 41317314,
    "learntime": 0.1475186760071665,
    "sampletime": 8.751318047987297,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 137,
    "reward_mean": 1.7751762933525654,
    "reward_max": 2.0644842351003603,
    "reward_min": 1.4031587210907162,
    "reward_std": 0.1584096341381679,
    "timesteps": 41678034,
    "learntime": 0.19781311391852796,
    "sampletime": 8.722342002904043,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 138,
    "reward_mean": 1.784280032193482,
    "reward_max": 2.295124737761037,
    "reward_min": 1.3954696832289377,
    "reward_std": 0.16871433205752479,
    "timesteps": 42038754,
    "learntime": 0.1519826811272651,
    "sampletime": 8.824902458116412,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 139,
    "reward_mean": 1.7879035264614567,
    "reward_max": 2.0722914818589624,
    "reward_min": 1.4163876529289101,
    "reward_std": 0.14743518210016962,
    "timesteps": 42399474,
    "learntime": 0.19397809286601841,
    "sampletime": 8.749079501954839,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 140,
    "reward_mean": 1.8066980332634235,
    "reward_max": 2.1623375027892022,
    "reward_min": 1.3385461158921081,
    "reward_std": 0.1673493757272423,
    "timesteps": 42760194,
    "learntime": 0.15676090703345835,
    "sampletime": 8.819690634030849,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 141,
    "reward_mean": 1.930593738766068,
    "reward_max": 2.2314051161132107,
    "reward_min": 1.6562074320862628,
    "reward_std": 0.13719826149110653,
    "timesteps": 43120914,
    "learntime": 0.16597551410086453,
    "sampletime": 8.797698057955131,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 142,
    "reward_mean": 1.812280337870279,
    "reward_max": 2.304144229313044,
    "reward_min": 1.3865188243657791,
    "reward_std": 0.15464246442822646,
    "timesteps": 43481634,
    "learntime": 0.1522117629647255,
    "sampletime": 8.750474718166515,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 143,
    "reward_mean": 1.4100071742215299,
    "reward_max": 2.20927278873701,
    "reward_min": -7.266487552406036,
    "reward_std": 1.7850084742638506,
    "timesteps": 43841154,
    "learntime": 0.1490586909931153,
    "sampletime": 8.755196850048378,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 144,
    "reward_mean": 1.813212084056762,
    "reward_max": 2.1963545659220673,
    "reward_min": 1.384708443504869,
    "reward_std": 0.15831254405844783,
    "timesteps": 44201874,
    "learntime": 0.15372668905183673,
    "sampletime": 8.706426465883851,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 145,
    "reward_mean": 1.7447219623649866,
    "reward_max": 2.105597976892371,
    "reward_min": 1.339036614972759,
    "reward_std": 0.16782338226241256,
    "timesteps": 44562594,
    "learntime": 0.1479454799555242,
    "sampletime": 8.729807222960517,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 146,
    "reward_mean": 1.81647539631136,
    "reward_max": 2.1367224395737217,
    "reward_min": 1.4211420690831273,
    "reward_std": 0.14262607660152263,
    "timesteps": 44923314,
    "learntime": 0.1590362519491464,
    "sampletime": 8.856381722958758,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 147,
    "reward_mean": 1.80448620569031,
    "reward_max": 2.2326774464348658,
    "reward_min": 1.4802137719022774,
    "reward_std": 0.15915584937565516,
    "timesteps": 45284034,
    "learntime": 0.14951410703361034,
    "sampletime": 8.860147648956627,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 148,
    "reward_mean": 1.3586959026783076,
    "reward_max": 2.307150808755648,
    "reward_min": -7.217648367592397,
    "reward_std": 1.8870853803963779,
    "timesteps": 45643593,
    "learntime": 0.1565556530840695,
    "sampletime": 8.77473449590616,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 149,
    "reward_mean": 1.7456451385345648,
    "reward_max": 2.2725174848367713,
    "reward_min": 1.2727821347705828,
    "reward_std": 0.1851092113244081,
    "timesteps": 46004313,
    "learntime": 0.15606592292897403,
    "sampletime": 8.638818790903315,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 150,
    "reward_mean": 1.3753365597756373,
    "reward_max": 2.03437508468447,
    "reward_min": -7.332755242797168,
    "reward_std": 1.883358673308476,
    "timesteps": 46363860,
    "learntime": 0.1496650909539312,
    "sampletime": 8.64689580607228,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 151,
    "reward_mean": 1.7184150739438915,
    "reward_max": 2.1862367217812158,
    "reward_min": 1.4404832661650366,
    "reward_std": 0.14673885902980138,
    "timesteps": 46724580,
    "learntime": 0.1476868458557874,
    "sampletime": 8.908757757162675,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 152,
    "reward_mean": 1.4561514125565402,
    "reward_max": 2.311653241684378,
    "reward_min": -7.310572289874089,
    "reward_std": 1.9363148937023542,
    "timesteps": 47084064,
    "learntime": 0.14759297901764512,
    "sampletime": 8.648745769169182,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 153,
    "reward_mean": 1.4706756497595639,
    "reward_max": 2.167780963224104,
    "reward_min": -7.019393686586147,
    "reward_std": 1.822297098086111,
    "timesteps": 47443665,
    "learntime": 0.15069158980622888,
    "sampletime": 8.7138663881924,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 154,
    "reward_mean": 1.768962130666477,
    "reward_max": 2.121673132053037,
    "reward_min": 1.496391346819243,
    "reward_std": 0.14183930780645343,
    "timesteps": 47804385,
    "learntime": 0.14757248992100358,
    "sampletime": 8.713814308168367,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 155,
    "reward_mean": 1.7808284233691296,
    "reward_max": 2.164449692137579,
    "reward_min": 1.3653991033141992,
    "reward_std": 0.14705033230553324,
    "timesteps": 48165105,
    "learntime": 0.14820448798127472,
    "sampletime": 8.622282891068608,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 156,
    "reward_mean": 1.8242908676837444,
    "reward_max": 2.1420392146136473,
    "reward_min": 1.2997861741512813,
    "reward_std": 0.16518073961172833,
    "timesteps": 48525825,
    "learntime": 0.15329780499450862,
    "sampletime": 8.768818024080247,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 157,
    "reward_mean": 1.8089089924937873,
    "reward_max": 2.2216031368192137,
    "reward_min": 1.5020883734299166,
    "reward_std": 0.13876427835718222,
    "timesteps": 48886545,
    "learntime": 0.15004208986647427,
    "sampletime": 8.83400811185129,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 158,
    "reward_mean": 1.8288847985877825,
    "reward_max": 2.2037483959169455,
    "reward_min": 1.3316251814972129,
    "reward_std": 0.18490642851643846,
    "timesteps": 49247265,
    "learntime": 0.15895111416466534,
    "sampletime": 8.823582197073847,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 159,
    "reward_mean": 1.8437067968493102,
    "reward_max": 2.103134929329492,
    "reward_min": 1.52851125384746,
    "reward_std": 0.1361606507260455,
    "timesteps": 49607985,
    "learntime": 0.14859098591841757,
    "sampletime": 8.943069254048169,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 160,
    "reward_mean": 1.82464729228552,
    "reward_max": 2.1831490748039784,
    "reward_min": 1.4245330864919874,
    "reward_std": 0.16987085396339557,
    "timesteps": 49968705,
    "learntime": 0.15166111197322607,
    "sampletime": 8.753994686994702,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 161,
    "reward_mean": 1.3767746615807182,
    "reward_max": 2.1834035331072883,
    "reward_min": -7.119546635884261,
    "reward_std": 1.8737834115931664,
    "timesteps": 50328261,
    "learntime": 0.15791669092141092,
    "sampletime": 8.745618392014876,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 162,
    "reward_mean": 1.7456695787635912,
    "reward_max": 2.091242304214656,
    "reward_min": 1.472778058000482,
    "reward_std": 0.13840703095030849,
    "timesteps": 50688981,
    "learntime": 0.15970694599673152,
    "sampletime": 8.77577156899497,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 163,
    "reward_mean": 1.814272975146143,
    "reward_max": 2.208903115766587,
    "reward_min": 1.4482499478617652,
    "reward_std": 0.14078033135560147,
    "timesteps": 51049701,
    "learntime": 0.15812353999353945,
    "sampletime": 8.79797385004349,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 164,
    "reward_mean": 1.38945321796791,
    "reward_max": 2.2257564013473714,
    "reward_min": -7.233096079982001,
    "reward_std": 1.8473473387762118,
    "timesteps": 51409242,
    "learntime": 0.15125611191615462,
    "sampletime": 8.814595128875226,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 165,
    "reward_mean": 1.4339745075798531,
    "reward_max": 2.1043467300196137,
    "reward_min": -7.3497854483350915,
    "reward_std": 1.8745880831640571,
    "timesteps": 51768696,
    "learntime": 0.1440056529827416,
    "sampletime": 8.718269084114581,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 166,
    "reward_mean": 1.4147149312635303,
    "reward_max": 2.13529224056401,
    "reward_min": -7.281291344054892,
    "reward_std": 1.846101229370237,
    "timesteps": 52128171,
    "learntime": 0.16029362613335252,
    "sampletime": 8.815277377143502,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 167,
    "reward_mean": 1.336050213266669,
    "reward_max": 2.1591368032955347,
    "reward_min": -7.416684472533235,
    "reward_std": 1.9401880237800702,
    "timesteps": 52487646,
    "learntime": 0.14418142288923264,
    "sampletime": 8.710663033882156,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 168,
    "reward_mean": 1.8381485013223635,
    "reward_max": 2.1862140653168085,
    "reward_min": 1.418121518142109,
    "reward_std": 0.15305138050043246,
    "timesteps": 52848366,
    "learntime": 0.15281477011740208,
    "sampletime": 8.768453099997714,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 169,
    "reward_mean": 1.795780583570839,
    "reward_max": 2.0927723826784064,
    "reward_min": 1.4450578463676516,
    "reward_std": 0.15612802049898292,
    "timesteps": 53209086,
    "learntime": 0.1518044020049274,
    "sampletime": 8.627667553024366,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 170,
    "reward_mean": 1.7976071301451144,
    "reward_max": 2.0357036503361665,
    "reward_min": 1.4919193068124095,
    "reward_std": 0.11976982975522477,
    "timesteps": 53569806,
    "learntime": 0.1468803130555898,
    "sampletime": 8.74479661998339,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 171,
    "reward_mean": 1.857412392185919,
    "reward_max": 2.3336088538778803,
    "reward_min": 1.5185861342346663,
    "reward_std": 0.16142326680787802,
    "timesteps": 53930526,
    "learntime": 0.1603388029616326,
    "sampletime": 8.769606189103797,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 172,
    "reward_mean": 1.8017639581272376,
    "reward_max": 2.0640383904489368,
    "reward_min": 1.382925763949361,
    "reward_std": 0.161203521708961,
    "timesteps": 54291246,
    "learntime": 0.1511887249071151,
    "sampletime": 8.708168264944106,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 173,
    "reward_mean": 1.3880431252154017,
    "reward_max": 2.2223448830191024,
    "reward_min": -7.253003590899013,
    "reward_std": 1.8888465290517698,
    "timesteps": 54650832,
    "learntime": 0.15839613298885524,
    "sampletime": 8.862463510828093,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 174,
    "reward_mean": 1.379675254848465,
    "reward_max": 2.230365407472059,
    "reward_min": -7.141001886062001,
    "reward_std": 1.825362870793174,
    "timesteps": 55010418,
    "learntime": 0.1553354561328888,
    "sampletime": 8.690712889889255,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 175,
    "reward_mean": 1.782194417570759,
    "reward_max": 2.085104230710484,
    "reward_min": 1.5368603137515775,
    "reward_std": 0.1214137265419355,
    "timesteps": 55371138,
    "learntime": 0.15252739982679486,
    "sampletime": 8.761955507099628,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 176,
    "reward_mean": 1.840054346538028,
    "reward_max": 2.184071595002683,
    "reward_min": 1.5060031140103183,
    "reward_std": 0.1616008345207717,
    "timesteps": 55731858,
    "learntime": 0.14946988900192082,
    "sampletime": 8.673711058916524,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 177,
    "reward_mean": 1.739214376002944,
    "reward_max": 2.0583406367381483,
    "reward_min": 1.4446914772984596,
    "reward_std": 0.11666887689826844,
    "timesteps": 56092578,
    "learntime": 0.1571498119737953,
    "sampletime": 8.8416277829092,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 178,
    "reward_mean": 0.9940473551046453,
    "reward_max": 2.20066966261815,
    "reward_min": -7.367640744792883,
    "reward_std": 2.646465515041753,
    "timesteps": 56450838,
    "learntime": 0.15686462610028684,
    "sampletime": 8.655263090040535,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 179,
    "reward_mean": 1.7488835818969448,
    "reward_max": 2.162407424777151,
    "reward_min": 1.4123363445021682,
    "reward_std": 0.16565769616457143,
    "timesteps": 56811558,
    "learntime": 0.14864171296358109,
    "sampletime": 8.765029046917334,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 180,
    "reward_mean": 1.941139313588819,
    "reward_max": 2.423711513444273,
    "reward_min": 1.198179451690078,
    "reward_std": 0.2012815913668782,
    "timesteps": 57172278,
    "learntime": 0.16091148997657,
    "sampletime": 8.976977818179876,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 181,
    "reward_mean": 1.8428971068702653,
    "reward_max": 2.1702572518124432,
    "reward_min": 1.4596220136471914,
    "reward_std": 0.15650157558651673,
    "timesteps": 57532998,
    "learntime": 0.15612245304509997,
    "sampletime": 8.78451270610094,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 182,
    "reward_mean": 1.803825875212515,
    "reward_max": 2.098548610483041,
    "reward_min": 1.465467035304753,
    "reward_std": 0.14116531485492242,
    "timesteps": 57893718,
    "learntime": 0.1544378011021763,
    "sampletime": 8.884323632111773,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 183,
    "reward_mean": 1.8247167029705886,
    "reward_max": 2.373854855255391,
    "reward_min": 1.3964388732653736,
    "reward_std": 0.18931770644398668,
    "timesteps": 58254438,
    "learntime": 0.19581977906636894,
    "sampletime": 8.77576629910618,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 184,
    "reward_mean": 1.7971552199627423,
    "reward_max": 2.092122784527921,
    "reward_min": 1.4574204492550251,
    "reward_std": 0.15515641516046177,
    "timesteps": 58615158,
    "learntime": 0.1541997028980404,
    "sampletime": 8.736565170809627,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 185,
    "reward_mean": 1.7619145150945523,
    "reward_max": 2.1345889256905712,
    "reward_min": 1.432403275961845,
    "reward_std": 0.15189598689091313,
    "timesteps": 58975878,
    "learntime": 0.1536476060282439,
    "sampletime": 8.740976042114198,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 186,
    "reward_mean": 1.7955146902146437,
    "reward_max": 2.2250617234544308,
    "reward_min": 1.327585315852154,
    "reward_std": 0.1779971580685472,
    "timesteps": 59336598,
    "learntime": 0.15043627400882542,
    "sampletime": 8.819313184125349,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 187,
    "reward_mean": 0.9643370940526369,
    "reward_max": 2.1676413180715737,
    "reward_min": -16.23306333382304,
    "reward_std": 3.090500919442468,
    "timesteps": 59694738,
    "learntime": 0.16029132599942386,
    "sampletime": 8.805167047074065,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 188,
    "reward_mean": 1.843970902629449,
    "reward_max": 2.232618503310457,
    "reward_min": 1.2024677752580637,
    "reward_std": 0.14694846383260252,
    "timesteps": 60055458,
    "learntime": 0.16106585995294154,
    "sampletime": 8.7014502750244,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 189,
    "reward_mean": 1.438626316266694,
    "reward_max": 2.1920461307163324,
    "reward_min": -7.05656140849566,
    "reward_std": 1.8787122452594043,
    "timesteps": 60415038,
    "learntime": 0.16246092086657882,
    "sampletime": 8.71437097992748,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 190,
    "reward_mean": 1.8003614040613294,
    "reward_max": 2.1307290005691617,
    "reward_min": 1.4516806826048325,
    "reward_std": 0.1430602450432688,
    "timesteps": 60775758,
    "learntime": 0.20806572400033474,
    "sampletime": 8.869582950137556,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 191,
    "reward_mean": 1.8935786640192105,
    "reward_max": 2.239351525070199,
    "reward_min": 1.4762412850913158,
    "reward_std": 0.15249481814256122,
    "timesteps": 61136478,
    "learntime": 0.15343738091178238,
    "sampletime": 8.749700112035498,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 192,
    "reward_mean": 1.8211057812223947,
    "reward_max": 2.1308118023973086,
    "reward_min": 1.407323477719202,
    "reward_std": 0.15053746497610604,
    "timesteps": 61497198,
    "learntime": 0.1954601260367781,
    "sampletime": 8.729928568005562,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 193,
    "reward_mean": 1.8136385148420868,
    "reward_max": 2.246201240916197,
    "reward_min": 1.4279015812913463,
    "reward_std": 0.15634043053514152,
    "timesteps": 61857918,
    "learntime": 0.14527664193883538,
    "sampletime": 8.724262369796634,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 194,
    "reward_mean": 1.8352354240911017,
    "reward_max": 2.170137421799481,
    "reward_min": 1.5230916516156834,
    "reward_std": 0.13548493492551916,
    "timesteps": 62218638,
    "learntime": 0.18502180790528655,
    "sampletime": 8.77363877184689,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 195,
    "reward_mean": 1.7962941283274119,
    "reward_max": 2.0462366108421848,
    "reward_min": 1.426633709333887,
    "reward_std": 0.14304229733013857,
    "timesteps": 62579358,
    "learntime": 0.15091351210139692,
    "sampletime": 8.778494267957285,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 196,
    "reward_mean": 1.8891849571059613,
    "reward_max": 2.2095627857594398,
    "reward_min": 1.5888619691152879,
    "reward_std": 0.13244648842996848,
    "timesteps": 62940078,
    "learntime": 0.19167461502365768,
    "sampletime": 8.666348210070282,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 197,
    "reward_mean": 1.8008798907012835,
    "reward_max": 2.0791545808694494,
    "reward_min": 1.4432123305812217,
    "reward_std": 0.12341858134894929,
    "timesteps": 63300798,
    "learntime": 0.15200589410960674,
    "sampletime": 8.742196486098692,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 198,
    "reward_mean": 1.8495113891358108,
    "reward_max": 2.142212590861491,
    "reward_min": 1.5779542286148445,
    "reward_std": 0.1293027805688972,
    "timesteps": 63661518,
    "learntime": 0.19466257793828845,
    "sampletime": 8.648047343129292,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 199,
    "reward_mean": 1.729832639503781,
    "reward_max": 2.0070939108898664,
    "reward_min": 1.367628741522571,
    "reward_std": 0.13839381977789564,
    "timesteps": 64022238,
    "learntime": 0.1570166361052543,
    "sampletime": 8.747585979057476,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 200,
    "reward_mean": 1.7936615234266307,
    "reward_max": 2.2368619737248827,
    "reward_min": 1.5117909162589844,
    "reward_std": 0.1463512363509587,
    "timesteps": 64382958,
    "learntime": 0.19088642508722842,
    "sampletime": 8.759143844014034,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 201,
    "reward_mean": 1.7970548136938835,
    "reward_max": 2.088431702472006,
    "reward_min": 1.5223393923220223,
    "reward_std": 0.13182592909762542,
    "timesteps": 64743678,
    "learntime": 0.11965517792850733,
    "sampletime": 8.752577401930466,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 202,
    "reward_mean": 1.8210082057407964,
    "reward_max": 2.1213621693622704,
    "reward_min": 1.286707993124074,
    "reward_std": 0.14834075912649353,
    "timesteps": 65104398,
    "learntime": 0.15753475879319012,
    "sampletime": 8.730925665935501,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 203,
    "reward_mean": 1.8824992755721925,
    "reward_max": 2.190121228214895,
    "reward_min": 1.5322229433157986,
    "reward_std": 0.14834913157334328,
    "timesteps": 65465118,
    "learntime": 0.2010931889526546,
    "sampletime": 8.725298119010404,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 204,
    "reward_mean": 1.5118467176575328,
    "reward_max": 2.312593747607684,
    "reward_min": -15.817833192477174,
    "reward_std": 2.4047607510443876,
    "timesteps": 65824659,
    "learntime": 0.17057963204570115,
    "sampletime": 8.739098265068606,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 205,
    "reward_mean": 1.8219972967676483,
    "reward_max": 2.2115239608890844,
    "reward_min": 1.4123195222152072,
    "reward_std": 0.14463140850492306,
    "timesteps": 66185379,
    "learntime": 0.20136630185879767,
    "sampletime": 8.690864586969838,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 206,
    "reward_mean": 1.8109988726480393,
    "reward_max": 2.117082428081296,
    "reward_min": 1.4749290332953051,
    "reward_std": 0.13176622508884583,
    "timesteps": 66546099,
    "learntime": 0.15546620287932456,
    "sampletime": 8.721725170966238,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 207,
    "reward_mean": 1.7930909653605012,
    "reward_max": 2.0361301999981856,
    "reward_min": 1.424054882376255,
    "reward_std": 0.1495074657238873,
    "timesteps": 66906819,
    "learntime": 0.18399953981861472,
    "sampletime": 8.731393823865801,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 208,
    "reward_mean": 1.7765636957756525,
    "reward_max": 2.263867376665022,
    "reward_min": 1.4222747506520872,
    "reward_std": 0.15876267154559331,
    "timesteps": 67267539,
    "learntime": 0.16396508808247745,
    "sampletime": 8.809377741999924,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 209,
    "reward_mean": 1.800006052862534,
    "reward_max": 2.213274839716781,
    "reward_min": 1.4300650380953965,
    "reward_std": 0.1587018300562845,
    "timesteps": 67628259,
    "learntime": 0.2035002401098609,
    "sampletime": 8.703642515931278,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 210,
    "reward_mean": 1.4442006792800355,
    "reward_max": 2.2166616543139672,
    "reward_min": -6.389626278029435,
    "reward_std": 1.6978692186445579,
    "timesteps": 67987785,
    "learntime": 0.15550969494506717,
    "sampletime": 8.670640837866813,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 211,
    "reward_mean": 1.8571361908933444,
    "reward_max": 2.5008536224010025,
    "reward_min": 1.4168670149167246,
    "reward_std": 0.18417548588837432,
    "timesteps": 68348505,
    "learntime": 0.19892331305891275,
    "sampletime": 8.74156163004227,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 212,
    "reward_mean": 1.7742812194164788,
    "reward_max": 2.0662467588783406,
    "reward_min": 1.4039031575622622,
    "reward_std": 0.15180997394648685,
    "timesteps": 68709225,
    "learntime": 0.15628118510358036,
    "sampletime": 8.790955632925034,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 213,
    "reward_mean": 1.7878241848349448,
    "reward_max": 2.1512389482918954,
    "reward_min": 1.4979766208932461,
    "reward_std": 0.13612409920164842,
    "timesteps": 69069945,
    "learntime": 0.20176049205474555,
    "sampletime": 8.826818859903142,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 214,
    "reward_mean": 1.8009985356434177,
    "reward_max": 2.138454180288435,
    "reward_min": 1.4709307801668066,
    "reward_std": 0.1458350430630285,
    "timesteps": 69430665,
    "learntime": 0.1587927839718759,
    "sampletime": 8.740763849113137,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 215,
    "reward_mean": 1.804381515841359,
    "reward_max": 2.105239201434109,
    "reward_min": 1.5170896030013485,
    "reward_std": 0.14172318259416064,
    "timesteps": 69791385,
    "learntime": 0.20169083215296268,
    "sampletime": 8.760563003830612,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 216,
    "reward_mean": 1.7971331299644318,
    "reward_max": 2.1268260571823396,
    "reward_min": 1.4459605244214084,
    "reward_std": 0.15078468860968006,
    "timesteps": 70152105,
    "learntime": 0.15516905602999032,
    "sampletime": 8.963027614168823,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 217,
    "reward_mean": 1.8374961479520833,
    "reward_max": 2.2238097263845797,
    "reward_min": 1.4415362016532292,
    "reward_std": 0.15249705550787637,
    "timesteps": 70512825,
    "learntime": 0.21660922397859395,
    "sampletime": 8.711965716909617,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 218,
    "reward_mean": 1.8301323946077694,
    "reward_max": 2.316788171530899,
    "reward_min": 1.3928435012154876,
    "reward_std": 0.1466548666497507,
    "timesteps": 70873545,
    "learntime": 0.15594293898902833,
    "sampletime": 8.713976576924324,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 219,
    "reward_mean": 1.8425919407412958,
    "reward_max": 2.3037858625290064,
    "reward_min": 1.5015549384115696,
    "reward_std": 0.1715394819132894,
    "timesteps": 71234265,
    "learntime": 0.197273873956874,
    "sampletime": 8.719471602002159,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 220,
    "reward_mean": 1.8329055517740787,
    "reward_max": 2.2128609895219338,
    "reward_min": 1.507759234924431,
    "reward_std": 0.14912174726101352,
    "timesteps": 71594985,
    "learntime": 0.15607893490232527,
    "sampletime": 8.756104255095124,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 221,
    "reward_mean": 1.811927478874959,
    "reward_max": 2.3212294674718357,
    "reward_min": 1.3863395554274587,
    "reward_std": 0.16421797879918876,
    "timesteps": 71955705,
    "learntime": 0.2211174019612372,
    "sampletime": 8.664772210875526,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 222,
    "reward_mean": 1.77288316021279,
    "reward_max": 2.222392289486542,
    "reward_min": 1.3944918010833596,
    "reward_std": 0.14838376021611627,
    "timesteps": 72316425,
    "learntime": 0.1600908429827541,
    "sampletime": 8.748189804144204,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 223,
    "reward_mean": 1.4404351551425434,
    "reward_max": 2.192269402623145,
    "reward_min": -7.133467654451541,
    "reward_std": 1.9012128052536656,
    "timesteps": 72676047,
    "learntime": 0.22217528894543648,
    "sampletime": 8.706263432977721,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 224,
    "reward_mean": 1.4352509268723224,
    "reward_max": 2.1681692001046446,
    "reward_min": -6.975107722505612,
    "reward_std": 1.8171900516913395,
    "timesteps": 73035927,
    "learntime": 0.16511188191361725,
    "sampletime": 8.757956604938954,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 225,
    "reward_mean": 1.4754693197392992,
    "reward_max": 2.374333402342418,
    "reward_min": -6.522817935490621,
    "reward_std": 1.7601159373110926,
    "timesteps": 73395558,
    "learntime": 0.20667804102413356,
    "sampletime": 8.752418123884127,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 226,
    "reward_mean": 1.830683311083722,
    "reward_max": 2.171123106219577,
    "reward_min": 1.5107280282324849,
    "reward_std": 0.13511821880465802,
    "timesteps": 73756278,
    "learntime": 0.16460992093198,
    "sampletime": 8.75863350299187,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 227,
    "reward_mean": 1.823913782919739,
    "reward_max": 2.2438724300712516,
    "reward_min": 1.4798992384281553,
    "reward_std": 0.15958756601867305,
    "timesteps": 74116998,
    "learntime": 0.18008626205846667,
    "sampletime": 8.680563106900081,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 228,
    "reward_mean": 1.3242318316595063,
    "reward_max": 2.126766646097441,
    "reward_min": -7.530450365892401,
    "reward_std": 1.950845062690502,
    "timesteps": 74476848,
    "learntime": 0.1435583580750972,
    "sampletime": 8.765413142973557,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 229,
    "reward_mean": 1.788567900310662,
    "reward_max": 2.3639010997770407,
    "reward_min": 1.3110898936151445,
    "reward_std": 0.1748287025625583,
    "timesteps": 74837568,
    "learntime": 0.194238955155015,
    "sampletime": 8.671229861909524,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 230,
    "reward_mean": 1.7806867836873856,
    "reward_max": 2.288122677919805,
    "reward_min": 1.4271478440231538,
    "reward_std": 0.14549624211679965,
    "timesteps": 75198288,
    "learntime": 0.16265805414877832,
    "sampletime": 8.59449245291762,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 231,
    "reward_mean": 1.7847229850582185,
    "reward_max": 2.0933867803480193,
    "reward_min": 1.4604989152592458,
    "reward_std": 0.151129289247205,
    "timesteps": 75559008,
    "learntime": 0.21744489390403032,
    "sampletime": 8.857967623043805,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 232,
    "reward_mean": 1.7915741839785952,
    "reward_max": 2.2461768525495724,
    "reward_min": 1.386186964499451,
    "reward_std": 0.14952094551493125,
    "timesteps": 75919728,
    "learntime": 0.16298357699997723,
    "sampletime": 8.708571441005915,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 233,
    "reward_mean": 1.8326820413111387,
    "reward_max": 2.1618043127148656,
    "reward_min": 1.474020817937948,
    "reward_std": 0.13436192268400823,
    "timesteps": 76280448,
    "learntime": 0.21086793090216815,
    "sampletime": 8.851467658067122,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 234,
    "reward_mean": 1.808357432132466,
    "reward_max": 2.2418431789256186,
    "reward_min": 1.433409873253282,
    "reward_std": 0.17223961171410007,
    "timesteps": 76641168,
    "learntime": 0.17421727697364986,
    "sampletime": 8.745793904876336,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 235,
    "reward_mean": 1.7571824232012458,
    "reward_max": 2.160232989367971,
    "reward_min": 1.353239358662075,
    "reward_std": 0.1593495641109732,
    "timesteps": 77001888,
    "learntime": 0.15635149902664125,
    "sampletime": 8.577474487945437,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 236,
    "reward_mean": 1.7875701442718968,
    "reward_max": 2.0769699571202636,
    "reward_min": 1.4372981421748199,
    "reward_std": 0.14035327643683868,
    "timesteps": 77362608,
    "learntime": 0.20547212613746524,
    "sampletime": 8.61689882306382,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 237,
    "reward_mean": 1.795078935878461,
    "reward_max": 2.0972457450733386,
    "reward_min": 1.4380526562630531,
    "reward_std": 0.13730051054087494,
    "timesteps": 77723328,
    "learntime": 0.16402982082217932,
    "sampletime": 8.60274343797937,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 238,
    "reward_mean": 1.8693440972802393,
    "reward_max": 2.315273136006326,
    "reward_min": 1.622635413696922,
    "reward_std": 0.1307480776834132,
    "timesteps": 78084048,
    "learntime": 0.20400978904217482,
    "sampletime": 8.7983878639061,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 239,
    "reward_mean": 1.8017433175453044,
    "reward_max": 2.295143403473597,
    "reward_min": 1.3826277800884157,
    "reward_std": 0.18704622482634145,
    "timesteps": 78444768,
    "learntime": 0.1603362939786166,
    "sampletime": 8.716543141985312,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 240,
    "reward_mean": 1.8436840268637056,
    "reward_max": 2.1833603916549866,
    "reward_min": 1.4181946678468684,
    "reward_std": 0.16686706346531743,
    "timesteps": 78805488,
    "learntime": 0.20743325003422797,
    "sampletime": 8.693904689978808,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 241,
    "reward_mean": 1.771714759111683,
    "reward_max": 1.983800043321079,
    "reward_min": 1.4564412240861442,
    "reward_std": 0.12629621338297506,
    "timesteps": 79166208,
    "learntime": 0.1550563459750265,
    "sampletime": 8.69014036282897,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 242,
    "reward_mean": 1.858994733838966,
    "reward_max": 2.2362663248698476,
    "reward_min": 1.373707151583703,
    "reward_std": 0.1626443064347829,
    "timesteps": 79526928,
    "learntime": 0.21306937700137496,
    "sampletime": 8.742828612914309,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 243,
    "reward_mean": 1.795040067383468,
    "reward_max": 2.085573627465317,
    "reward_min": 1.2867317700310534,
    "reward_std": 0.16034914971492373,
    "timesteps": 79887648,
    "learntime": 0.1544075170531869,
    "sampletime": 8.686706314096227,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 244,
    "reward_mean": 1.8889420597359354,
    "reward_max": 2.25391548744863,
    "reward_min": 1.5754488510719933,
    "reward_std": 0.16848884471339423,
    "timesteps": 80248368,
    "learntime": 0.20830403501167893,
    "sampletime": 8.688276204047725,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 245,
    "reward_mean": 1.8049524586971177,
    "reward_max": 2.1268959742993676,
    "reward_min": 1.439341181483485,
    "reward_std": 0.14737493293303564,
    "timesteps": 80609088,
    "learntime": 0.15056913695298135,
    "sampletime": 8.901543786982074,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 246,
    "reward_mean": 1.8548513025937297,
    "reward_max": 2.3684361524109097,
    "reward_min": 1.5364342871277237,
    "reward_std": 0.16073015096855145,
    "timesteps": 80969808,
    "learntime": 0.19950844417326152,
    "sampletime": 8.678339943988249,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 247,
    "reward_mean": 1.790945064872996,
    "reward_max": 2.0939921988174306,
    "reward_min": 1.493722614347157,
    "reward_std": 0.147217293814363,
    "timesteps": 81330528,
    "learntime": 0.1508643019478768,
    "sampletime": 8.755204237997532,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 248,
    "reward_mean": 1.76918798397426,
    "reward_max": 2.182189125778454,
    "reward_min": 1.4297864425882088,
    "reward_std": 0.17244055815493245,
    "timesteps": 81691248,
    "learntime": 0.20048861508257687,
    "sampletime": 8.65992347500287,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 249,
    "reward_mean": 1.7757892346356525,
    "reward_max": 2.2254994312110763,
    "reward_min": 1.4306042916423634,
    "reward_std": 0.15896884903232575,
    "timesteps": 82051968,
    "learntime": 0.15800403198227286,
    "sampletime": 8.694814797025174,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 250,
    "reward_mean": 1.3636236002410738,
    "reward_max": 2.0525708882616684,
    "reward_min": -7.121890552912553,
    "reward_std": 1.8573786466707305,
    "timesteps": 82411518,
    "learntime": 0.20839794189669192,
    "sampletime": 8.721216820878908,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 251,
    "reward_mean": 1.764847783898364,
    "reward_max": 2.176120047683877,
    "reward_min": 1.4676811913636285,
    "reward_std": 0.13797940479523071,
    "timesteps": 82772238,
    "learntime": 0.16054522804915905,
    "sampletime": 8.819731001043692,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 252,
    "reward_mean": 1.808566674230489,
    "reward_max": 2.2441556820174946,
    "reward_min": 1.395843884854745,
    "reward_std": 0.16035451936238396,
    "timesteps": 83132958,
    "learntime": 0.2088542990386486,
    "sampletime": 8.932033821940422,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 253,
    "reward_mean": 1.7990504917998011,
    "reward_max": 2.146488002011069,
    "reward_min": 1.490307062567973,
    "reward_std": 0.13474515523236635,
    "timesteps": 83493678,
    "learntime": 0.15863039903342724,
    "sampletime": 8.713209797162563,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 254,
    "reward_mean": 1.7832392112415811,
    "reward_max": 2.249575880950665,
    "reward_min": 1.476838157402886,
    "reward_std": 0.15377429484945437,
    "timesteps": 83854398,
    "learntime": 0.20074665010906756,
    "sampletime": 8.68286594003439,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 255,
    "reward_mean": 1.8107249948489357,
    "reward_max": 2.1557598595620298,
    "reward_min": 1.4661660118215472,
    "reward_std": 0.14063681824662472,
    "timesteps": 84215118,
    "learntime": 0.16071648988872766,
    "sampletime": 8.72435710998252,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 256,
    "reward_mean": 1.7535851893119032,
    "reward_max": 2.253267184245594,
    "reward_min": 1.4549244300561048,
    "reward_std": 0.15406554373074544,
    "timesteps": 84575838,
    "learntime": 0.21651371289044619,
    "sampletime": 8.65275832102634,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 257,
    "reward_mean": 1.772796079529246,
    "reward_max": 2.058597084371175,
    "reward_min": 1.4117709306477917,
    "reward_std": 0.13881458136298128,
    "timesteps": 84936558,
    "learntime": 0.15845749503932893,
    "sampletime": 8.670642819954082,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 258,
    "reward_mean": 1.8609553792834626,
    "reward_max": 2.303732894325741,
    "reward_min": 1.5600697874841762,
    "reward_std": 0.15151987657639435,
    "timesteps": 85297278,
    "learntime": 0.21176785393618047,
    "sampletime": 8.705386999063194,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 259,
    "reward_mean": 1.8339252404980968,
    "reward_max": 2.2661710937408652,
    "reward_min": 1.3723343453144248,
    "reward_std": 0.14469995980707845,
    "timesteps": 85657998,
    "learntime": 0.16633134498260915,
    "sampletime": 8.75371303409338,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 260,
    "reward_mean": 1.793164525474498,
    "reward_max": 2.1486918194870186,
    "reward_min": 1.3281637091598797,
    "reward_std": 0.16810548416356758,
    "timesteps": 86018718,
    "learntime": 0.20483344211243093,
    "sampletime": 8.858784712152556,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 261,
    "reward_mean": 1.7806970054074338,
    "reward_max": 2.1105469005450472,
    "reward_min": 1.5051703065647843,
    "reward_std": 0.1399526304891225,
    "timesteps": 86379438,
    "learntime": 0.1533785630017519,
    "sampletime": 8.734421819914132,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 262,
    "reward_mean": 1.8549171949294303,
    "reward_max": 2.2972583723550803,
    "reward_min": 1.5285086320205152,
    "reward_std": 0.15811388257011846,
    "timesteps": 86740158,
    "learntime": 0.19692806294187903,
    "sampletime": 8.863250631839037,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 263,
    "reward_mean": 1.8775675719260558,
    "reward_max": 2.3710778740227583,
    "reward_min": 1.585561034505986,
    "reward_std": 0.16034818967226916,
    "timesteps": 87100878,
    "learntime": 0.16144196107052267,
    "sampletime": 8.734560311073437,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 264,
    "reward_mean": 1.8197571454192505,
    "reward_max": 2.336344099892866,
    "reward_min": 1.5036185854974458,
    "reward_std": 0.15730341914998358,
    "timesteps": 87461598,
    "learntime": 0.2053714799694717,
    "sampletime": 8.671797547955066,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 265,
    "reward_mean": 0.9103517976407914,
    "reward_max": 2.09442400062493,
    "reward_min": -7.836862491768307,
    "reward_std": 2.583619083172783,
    "timesteps": 87820038,
    "learntime": 0.16351940599270165,
    "sampletime": 8.53390096500516,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 266,
    "reward_mean": 1.8026218315693865,
    "reward_max": 2.1802470174245348,
    "reward_min": 1.3316910786794092,
    "reward_std": 0.1811288919977156,
    "timesteps": 88180758,
    "learntime": 0.21529579302296042,
    "sampletime": 8.603453350020573,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 267,
    "reward_mean": 1.3974828281256018,
    "reward_max": 2.061259273519017,
    "reward_min": -7.673006397517219,
    "reward_std": 1.9972130768286238,
    "timesteps": 88540425,
    "learntime": 0.1500389559660107,
    "sampletime": 8.640820491826162,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 268,
    "reward_mean": 1.8235095112417767,
    "reward_max": 2.203539260126874,
    "reward_min": 1.4108119816792704,
    "reward_std": 0.1582901524035664,
    "timesteps": 88901145,
    "learntime": 0.20398072199895978,
    "sampletime": 8.783953384961933,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 269,
    "reward_mean": 1.7604906583214315,
    "reward_max": 2.1717418551790715,
    "reward_min": 1.363958090261965,
    "reward_std": 0.1501624726478809,
    "timesteps": 89261865,
    "learntime": 0.1635142599698156,
    "sampletime": 8.8253166989889,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 270,
    "reward_mean": 1.7557197075467967,
    "reward_max": 2.268645917085283,
    "reward_min": 1.3896972421948262,
    "reward_std": 0.16663040920461225,
    "timesteps": 89622585,
    "learntime": 0.20294459001161158,
    "sampletime": 8.754157090792432,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 271,
    "reward_mean": 1.7312582391085471,
    "reward_max": 2.108561460581381,
    "reward_min": 1.2484867052601951,
    "reward_std": 0.15970336567420992,
    "timesteps": 89983305,
    "learntime": 0.160045264987275,
    "sampletime": 8.701600055908784,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 272,
    "reward_mean": 1.4333913266342702,
    "reward_max": 2.208498814065628,
    "reward_min": -7.338473837693915,
    "reward_std": 1.8820796784388374,
    "timesteps": 90342906,
    "learntime": 0.15339718502946198,
    "sampletime": 8.750527964904904,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 273,
    "reward_mean": 1.7888719766541454,
    "reward_max": 2.3407960325128028,
    "reward_min": 1.35689864644175,
    "reward_std": 0.15329163266947335,
    "timesteps": 90703626,
    "learntime": 0.16109487996436656,
    "sampletime": 8.884442884940654,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 274,
    "reward_mean": 1.825769956238235,
    "reward_max": 2.137097630004227,
    "reward_min": 1.407984763990633,
    "reward_std": 0.15202495557902748,
    "timesteps": 91064346,
    "learntime": 0.15873058582656085,
    "sampletime": 8.72833052300848,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 275,
    "reward_mean": 1.90924868673543,
    "reward_max": 2.2621497645564914,
    "reward_min": 1.5255306838644713,
    "reward_std": 0.13544148503547235,
    "timesteps": 91425066,
    "learntime": 0.20579119911417365,
    "sampletime": 8.765960461925715,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 276,
    "reward_mean": 1.731193872484324,
    "reward_max": 2.125008021700934,
    "reward_min": 1.4593476864974917,
    "reward_std": 0.13392944393474468,
    "timesteps": 91785786,
    "learntime": 0.161645018029958,
    "sampletime": 8.758191658882424,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 277,
    "reward_mean": 1.7164231891902695,
    "reward_max": 2.039251628715479,
    "reward_min": 1.385380567663972,
    "reward_std": 0.14089005858883707,
    "timesteps": 92146506,
    "learntime": 0.20068431086838245,
    "sampletime": 8.727348111802712,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 278,
    "reward_mean": 1.8488602199546411,
    "reward_max": 2.201267297450224,
    "reward_min": 1.5034855240272422,
    "reward_std": 0.16065414463881372,
    "timesteps": 92507226,
    "learntime": 0.16040054615586996,
    "sampletime": 8.73809392284602,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 279,
    "reward_mean": 1.7837742049520746,
    "reward_max": 2.0615356023269893,
    "reward_min": 1.5063225072773265,
    "reward_std": 0.13794696017235442,
    "timesteps": 92867946,
    "learntime": 0.20684302202425897,
    "sampletime": 8.798339044908062,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 280,
    "reward_mean": 1.849439811953253,
    "reward_max": 2.240117024778471,
    "reward_min": 1.4644301908133008,
    "reward_std": 0.15725818202054717,
    "timesteps": 93228666,
    "learntime": 0.2072176500223577,
    "sampletime": 8.775764979887754,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 281,
    "reward_mean": 1.843861340656517,
    "reward_max": 2.1594567540080507,
    "reward_min": 1.492212367824485,
    "reward_std": 0.13192109505905975,
    "timesteps": 93589386,
    "learntime": 0.15877183992415667,
    "sampletime": 8.8798959760461,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 282,
    "reward_mean": 1.3442343871453364,
    "reward_max": 2.204878960249266,
    "reward_min": -8.03333967149427,
    "reward_std": 2.0771126591178266,
    "timesteps": 93948990,
    "learntime": 0.21753338701091707,
    "sampletime": 8.739559192908928,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 283,
    "reward_mean": 1.7477486010519812,
    "reward_max": 2.1346971991087114,
    "reward_min": 1.281812228608141,
    "reward_std": 0.17336497845050616,
    "timesteps": 94309710,
    "learntime": 0.15830861986614764,
    "sampletime": 8.973400726914406,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 284,
    "reward_mean": 1.7677404827364267,
    "reward_max": 2.167810184068608,
    "reward_min": 1.3480153671028345,
    "reward_std": 0.16308506475099732,
    "timesteps": 94670430,
    "learntime": 0.21403654920868576,
    "sampletime": 8.719536127988249,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 285,
    "reward_mean": 1.3658859901166627,
    "reward_max": 2.0589425296356114,
    "reward_min": -7.182654366503951,
    "reward_std": 1.872060574480305,
    "timesteps": 95030130,
    "learntime": 0.15199081902392209,
    "sampletime": 8.82671175710857,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 286,
    "reward_mean": 1.8683929468326195,
    "reward_max": 2.2437384412931127,
    "reward_min": 1.447718868686048,
    "reward_std": 0.1577977124614683,
    "timesteps": 95390850,
    "learntime": 0.19667704380117357,
    "sampletime": 8.839721662923694,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 287,
    "reward_mean": 1.8088714069938734,
    "reward_max": 2.1191133283763017,
    "reward_min": 1.3868915564140059,
    "reward_std": 0.14933570162467213,
    "timesteps": 95751570,
    "learntime": 0.16253097099252045,
    "sampletime": 8.808912015054375,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 288,
    "reward_mean": 1.791077780195291,
    "reward_max": 2.1262456777516143,
    "reward_min": 1.4547958808252575,
    "reward_std": 0.131556917135316,
    "timesteps": 96112290,
    "learntime": 0.21911987499333918,
    "sampletime": 8.672406970057636,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 289,
    "reward_mean": 1.7847033749713859,
    "reward_max": 2.2734466878887725,
    "reward_min": 1.381951862958497,
    "reward_std": 0.16635187374989785,
    "timesteps": 96473010,
    "learntime": 0.1594969481229782,
    "sampletime": 8.78192372014746,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 290,
    "reward_mean": 1.3561029756300291,
    "reward_max": 2.374852677288631,
    "reward_min": -7.606885436689484,
    "reward_std": 1.9298526999335939,
    "timesteps": 96832503,
    "learntime": 0.21473585884086788,
    "sampletime": 8.819715276826173,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 291,
    "reward_mean": 1.3962530085861309,
    "reward_max": 2.090792578935648,
    "reward_min": -7.237433234462517,
    "reward_std": 1.8957063557630864,
    "timesteps": 97192029,
    "learntime": 0.1695798800792545,
    "sampletime": 8.909360626945272,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 292,
    "reward_mean": 1.8050121910313957,
    "reward_max": 2.2215836568044085,
    "reward_min": 1.354331657773757,
    "reward_std": 0.14889291505651256,
    "timesteps": 97552749,
    "learntime": 0.22191271488554776,
    "sampletime": 8.778035192983225,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 293,
    "reward_mean": 1.7924337326823596,
    "reward_max": 2.1580716141104443,
    "reward_min": 1.4368741094058881,
    "reward_std": 0.14701399975379767,
    "timesteps": 97913469,
    "learntime": 0.16344599798321724,
    "sampletime": 8.822589519899338,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 294,
    "reward_mean": 1.8106103797850461,
    "reward_max": 2.232371363982867,
    "reward_min": 1.452422617487944,
    "reward_std": 0.1628216076617334,
    "timesteps": 98274189,
    "learntime": 0.2090340389404446,
    "sampletime": 8.80387214012444,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 295,
    "reward_mean": 1.822919917498628,
    "reward_max": 2.341755945962203,
    "reward_min": 1.5635051079281943,
    "reward_std": 0.1481446356300657,
    "timesteps": 98634909,
    "learntime": 0.16376674291677773,
    "sampletime": 8.83750723907724,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 296,
    "reward_mean": 1.8226905374899642,
    "reward_max": 2.164881212041814,
    "reward_min": 1.443218582380336,
    "reward_std": 0.14240926366818188,
    "timesteps": 98995629,
    "learntime": 0.2099146950058639,
    "sampletime": 8.813477178104222,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 297,
    "reward_mean": 1.341035582362101,
    "reward_max": 2.1032548110057205,
    "reward_min": -7.467996717923546,
    "reward_std": 1.8639055521985004,
    "timesteps": 99355083,
    "learntime": 0.16505759302526712,
    "sampletime": 8.663865493843332,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 298,
    "reward_mean": 1.378849074827383,
    "reward_max": 2.0895831735913144,
    "reward_min": -7.312044562080479,
    "reward_std": 1.8970566499159665,
    "timesteps": 99714663,
    "learntime": 0.20232052798382938,
    "sampletime": 8.876650384860113,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 299,
    "reward_mean": 1.7899827547990976,
    "reward_max": 2.044117443305256,
    "reward_min": 1.4858935056601876,
    "reward_std": 0.12632493380970655,
    "timesteps": 100075383,
    "learntime": 0.15393468318507075,
    "sampletime": 8.780485318042338,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 300,
    "reward_mean": 1.463518628627,
    "reward_max": 2.2460904575718517,
    "reward_min": -6.2320886252483545,
    "reward_std": 1.6638805136554744,
    "timesteps": 100434879,
    "learntime": 0.21030049212276936,
    "sampletime": 8.774122381117195,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 301,
    "reward_mean": 1.3818788452514454,
    "reward_max": 2.2374983945011255,
    "reward_min": -7.413532295193752,
    "reward_std": 1.8611511500309144,
    "timesteps": 100794597,
    "learntime": 0.15428110701031983,
    "sampletime": 8.661596026970074,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 302,
    "reward_mean": 0.5752814372600734,
    "reward_max": 2.178473666076156,
    "reward_min": -16.143620492867548,
    "reward_std": 3.4761241246900334,
    "timesteps": 101151768,
    "learntime": 0.19883769284933805,
    "sampletime": 8.712783666094765,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 303,
    "reward_mean": 1.3708030222959544,
    "reward_max": 2.153588949364182,
    "reward_min": -15.979263749867448,
    "reward_std": 2.464599775024891,
    "timesteps": 101511312,
    "learntime": 0.16507681692019105,
    "sampletime": 8.692944017006084,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 304,
    "reward_mean": 1.8126939788975958,
    "reward_max": 2.1432414176824435,
    "reward_min": 1.4376446398638274,
    "reward_std": 0.157910311468934,
    "timesteps": 101872032,
    "learntime": 0.21262338291853666,
    "sampletime": 8.672836285084486,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 305,
    "reward_mean": 1.8000285941331764,
    "reward_max": 2.082937351891206,
    "reward_min": 1.4618161378153152,
    "reward_std": 0.135598463447623,
    "timesteps": 102232752,
    "learntime": 0.15059821284376085,
    "sampletime": 8.703535923967138,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 306,
    "reward_mean": 1.793591977893295,
    "reward_max": 2.0952150896644297,
    "reward_min": 1.4293329153054661,
    "reward_std": 0.14007220630518658,
    "timesteps": 102593472,
    "learntime": 0.19958596490323544,
    "sampletime": 8.656712586991489,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 307,
    "reward_mean": 1.8486883286853337,
    "reward_max": 2.1516319590575406,
    "reward_min": 1.4173883330676627,
    "reward_std": 0.1457456095336566,
    "timesteps": 102954192,
    "learntime": 0.1796318970154971,
    "sampletime": 8.728555920068175,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 308,
    "reward_mean": 1.8214861327150742,
    "reward_max": 2.1544534385741283,
    "reward_min": 1.5084527878524616,
    "reward_std": 0.1353457550448442,
    "timesteps": 103314912,
    "learntime": 0.23005952592939138,
    "sampletime": 8.696834307163954,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 309,
    "reward_mean": 1.4579583643626997,
    "reward_max": 2.322651483466162,
    "reward_min": -6.4525966052606245,
    "reward_std": 1.7435164119865654,
    "timesteps": 103674531,
    "learntime": 0.16111406893469393,
    "sampletime": 8.776913261972368,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 310,
    "reward_mean": 1.8732687962466321,
    "reward_max": 2.2067097369722544,
    "reward_min": 1.587939740345587,
    "reward_std": 0.13855750751462118,
    "timesteps": 104035251,
    "learntime": 0.21597942803055048,
    "sampletime": 8.808454410172999,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 311,
    "reward_mean": 1.8036621875417351,
    "reward_max": 2.1872390364627448,
    "reward_min": 1.506919445110145,
    "reward_std": 0.11545293302394215,
    "timesteps": 104395971,
    "learntime": 0.15789102599956095,
    "sampletime": 8.703068768139929,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 312,
    "reward_mean": 1.8488645363134524,
    "reward_max": 2.1912449375411462,
    "reward_min": 1.5413742499683076,
    "reward_std": 0.13818337984430507,
    "timesteps": 104756691,
    "learntime": 0.22316734213382006,
    "sampletime": 8.811256035929546,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 313,
    "reward_mean": 1.7810927403939225,
    "reward_max": 2.0921345719576054,
    "reward_min": 1.294925840246968,
    "reward_std": 0.14801931323376513,
    "timesteps": 105117411,
    "learntime": 0.16941824997775257,
    "sampletime": 8.72421714104712,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 314,
    "reward_mean": 1.8050792599999903,
    "reward_max": 2.3381135191293905,
    "reward_min": 1.3603333525275525,
    "reward_std": 0.19138180302257832,
    "timesteps": 105478131,
    "learntime": 0.23227930394932628,
    "sampletime": 8.751793364994228,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 315,
    "reward_mean": 1.3719256124440335,
    "reward_max": 2.174738001016629,
    "reward_min": -6.726783259582149,
    "reward_std": 1.7530785854929052,
    "timesteps": 105837798,
    "learntime": 0.16002244199626148,
    "sampletime": 8.83491196995601,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 316,
    "reward_mean": 1.843603078988881,
    "reward_max": 2.280674756692529,
    "reward_min": 1.4972577681861956,
    "reward_std": 0.16055048565821833,
    "timesteps": 106198518,
    "learntime": 0.20355530991218984,
    "sampletime": 8.76130215707235,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 317,
    "reward_mean": 1.8322164490970505,
    "reward_max": 2.238796521683757,
    "reward_min": 1.4572395806381877,
    "reward_std": 0.14527311953318947,
    "timesteps": 106559238,
    "learntime": 0.16437878599390388,
    "sampletime": 8.710235279984772,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 318,
    "reward_mean": 1.8600414957328382,
    "reward_max": 2.1981052176984504,
    "reward_min": 1.606038658121232,
    "reward_std": 0.12987204545870087,
    "timesteps": 106919958,
    "learntime": 0.19774328102357686,
    "sampletime": 8.791986167896539,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 319,
    "reward_mean": 1.8267169650274342,
    "reward_max": 2.158081208937799,
    "reward_min": 1.5747599185684265,
    "reward_std": 0.12746999288871863,
    "timesteps": 107280678,
    "learntime": 0.15776388486847281,
    "sampletime": 8.871941349934787,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 320,
    "reward_mean": 1.8983809861091725,
    "reward_max": 2.2197879007408923,
    "reward_min": 1.462178990685829,
    "reward_std": 0.1637601735702608,
    "timesteps": 107641398,
    "learntime": 0.22926731104962528,
    "sampletime": 8.724393289070576,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 321,
    "reward_mean": 1.4260418118916467,
    "reward_max": 2.2193983739107863,
    "reward_min": -7.100374048100398,
    "reward_std": 1.8108589098392405,
    "timesteps": 108001116,
    "learntime": 0.15827737608924508,
    "sampletime": 8.691625791136175,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 322,
    "reward_mean": 1.8463943739267679,
    "reward_max": 2.2155673719667384,
    "reward_min": 1.4843307045891607,
    "reward_std": 0.15965186172899506,
    "timesteps": 108361836,
    "learntime": 0.21686494001187384,
    "sampletime": 8.829859293065965,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 323,
    "reward_mean": 1.795688675794087,
    "reward_max": 2.1218115299813096,
    "reward_min": 1.5775461825735042,
    "reward_std": 0.11835660008688606,
    "timesteps": 108722556,
    "learntime": 0.165066973073408,
    "sampletime": 8.79592080716975,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 324,
    "reward_mean": 1.800788596482719,
    "reward_max": 2.1942804796342497,
    "reward_min": 1.3710564106709833,
    "reward_std": 0.18199573803965846,
    "timesteps": 109083276,
    "learntime": 0.21379853086546063,
    "sampletime": 8.796657558064908,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 325,
    "reward_mean": 1.797354482148562,
    "reward_max": 2.27733017726051,
    "reward_min": 1.312105224300493,
    "reward_std": 0.19050501564828176,
    "timesteps": 109443996,
    "learntime": 0.16775729693472385,
    "sampletime": 8.719189456896856,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 326,
    "reward_mean": 1.8475037647423336,
    "reward_max": 2.209733785906184,
    "reward_min": 1.3557130900338605,
    "reward_std": 0.17321128377743533,
    "timesteps": 109804716,
    "learntime": 0.19465718721039593,
    "sampletime": 8.757315204944462,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 327,
    "reward_mean": 1.7500540690715085,
    "reward_max": 2.1853030877492974,
    "reward_min": 1.2928066765183948,
    "reward_std": 0.17968296852884447,
    "timesteps": 110165436,
    "learntime": 0.1619957429356873,
    "sampletime": 8.772441933164373,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 328,
    "reward_mean": 1.8323166682071519,
    "reward_max": 2.245910514462592,
    "reward_min": 1.4332946862348073,
    "reward_std": 0.16722675650345217,
    "timesteps": 110526156,
    "learntime": 0.20246745110489428,
    "sampletime": 8.766223010141402,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 329,
    "reward_mean": 1.7373811356165536,
    "reward_max": 2.102427733342415,
    "reward_min": 1.4200266892183895,
    "reward_std": 0.14547141901878807,
    "timesteps": 110886876,
    "learntime": 0.16034710011444986,
    "sampletime": 8.780417089117691,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 330,
    "reward_mean": 1.7533232499316114,
    "reward_max": 2.0962451136521927,
    "reward_min": 1.4927599390044397,
    "reward_std": 0.14173803525090836,
    "timesteps": 111247596,
    "learntime": 0.2115548369474709,
    "sampletime": 8.873499998124316,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 331,
    "reward_mean": 1.7523895778628853,
    "reward_max": 2.09711208981025,
    "reward_min": 1.437181190178361,
    "reward_std": 0.13022283028032394,
    "timesteps": 111608316,
    "learntime": 0.16463982313871384,
    "sampletime": 8.818752617109567,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 332,
    "reward_mean": 1.770883108495221,
    "reward_max": 2.1007038939095533,
    "reward_min": 1.3935900437927808,
    "reward_std": 0.15574446498819575,
    "timesteps": 111969036,
    "learntime": 0.20563111803494394,
    "sampletime": 8.761211237171665,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 333,
    "reward_mean": 1.8607091829350773,
    "reward_max": 2.2292422371789447,
    "reward_min": 1.5284252799765154,
    "reward_std": 0.15209170473283654,
    "timesteps": 112329756,
    "learntime": 0.17345611099153757,
    "sampletime": 8.771362054161727,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 334,
    "reward_mean": 1.7537708650976758,
    "reward_max": 2.058560087844714,
    "reward_min": 1.4077729717122756,
    "reward_std": 0.14648559432705777,
    "timesteps": 112690476,
    "learntime": 0.19911567796953022,
    "sampletime": 8.609046845929697,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 335,
    "reward_mean": 1.8318694626853138,
    "reward_max": 2.307371112513268,
    "reward_min": 1.4105009759994993,
    "reward_std": 0.15342234302026558,
    "timesteps": 113051196,
    "learntime": 0.1749155700672418,
    "sampletime": 8.61781472992152,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 336,
    "reward_mean": 1.854763269979414,
    "reward_max": 2.1162501339551634,
    "reward_min": 1.598085132841432,
    "reward_std": 0.14397448857159437,
    "timesteps": 113411916,
    "learntime": 0.21657215198501945,
    "sampletime": 8.73334185918793,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 337,
    "reward_mean": 1.7922362146621589,
    "reward_max": 2.150258961482021,
    "reward_min": 1.4207245169531983,
    "reward_std": 0.1496830144005522,
    "timesteps": 113772636,
    "learntime": 0.16578669799491763,
    "sampletime": 8.512941049877554,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 338,
    "reward_mean": 1.8056101239452063,
    "reward_max": 2.127704831409957,
    "reward_min": 1.3894881427316252,
    "reward_std": 0.15397840927947154,
    "timesteps": 114133356,
    "learntime": 0.20494893193244934,
    "sampletime": 8.795558077050373,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 339,
    "reward_mean": 1.7702522225794013,
    "reward_max": 2.152960714425495,
    "reward_min": 1.4268982262235055,
    "reward_std": 0.15713949098682145,
    "timesteps": 114494076,
    "learntime": 0.16397066111676395,
    "sampletime": 8.701301269931719,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 340,
    "reward_mean": 1.7588272073490003,
    "reward_max": 2.1151864439651185,
    "reward_min": 1.3753553296829142,
    "reward_std": 0.14592591482162154,
    "timesteps": 114854796,
    "learntime": 0.20931692700833082,
    "sampletime": 8.792131052119657,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 341,
    "reward_mean": 1.787435832078983,
    "reward_max": 2.1512203665774745,
    "reward_min": 1.3725550407314455,
    "reward_std": 0.17087255872550738,
    "timesteps": 115215516,
    "learntime": 0.16354316496290267,
    "sampletime": 8.872587837977335,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 342,
    "reward_mean": 1.7863294691984415,
    "reward_max": 2.0776615133650123,
    "reward_min": 1.5006365265728803,
    "reward_std": 0.1342194500090659,
    "timesteps": 115576236,
    "learntime": 0.19541777996346354,
    "sampletime": 8.555845476221293,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 343,
    "reward_mean": 1.8446266121791561,
    "reward_max": 2.3803342954876494,
    "reward_min": 1.5073505530211442,
    "reward_std": 0.15863706058835958,
    "timesteps": 115936956,
    "learntime": 0.16122761904262006,
    "sampletime": 8.723323477897793,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 344,
    "reward_mean": 1.845942617927944,
    "reward_max": 2.076528194048228,
    "reward_min": 1.5934687075536582,
    "reward_std": 0.1176942421187831,
    "timesteps": 116297676,
    "learntime": 0.21381675591692328,
    "sampletime": 8.75405168486759,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 345,
    "reward_mean": 1.8010891640750692,
    "reward_max": 2.239594246652104,
    "reward_min": 1.1846181470777282,
    "reward_std": 0.17639475132855179,
    "timesteps": 116658396,
    "learntime": 0.15422483417205513,
    "sampletime": 8.720621874090284,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 346,
    "reward_mean": 1.7994379023824718,
    "reward_max": 2.3028487518659477,
    "reward_min": 1.3539841144439464,
    "reward_std": 0.17769246336491587,
    "timesteps": 117019116,
    "learntime": 0.15879196603782475,
    "sampletime": 8.679544029990211,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 347,
    "reward_mean": 0.9758915791161084,
    "reward_max": 2.2879799003917864,
    "reward_min": -7.190777793454334,
    "reward_std": 2.5221658402354996,
    "timesteps": 117377604,
    "learntime": 0.1647443720139563,
    "sampletime": 8.594008776824921,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 348,
    "reward_mean": 1.0082910078214604,
    "reward_max": 2.1780389871241286,
    "reward_min": -7.210386497932524,
    "reward_std": 2.525537119383957,
    "timesteps": 117736092,
    "learntime": 0.1613240330480039,
    "sampletime": 8.812609918182716,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 349,
    "reward_mean": 1.8939671335735886,
    "reward_max": 2.226074272764586,
    "reward_min": 1.506234285243406,
    "reward_std": 0.14988503470090597,
    "timesteps": 118096812,
    "learntime": 0.16067194589413702,
    "sampletime": 8.767651204951108,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 350,
    "reward_mean": 1.8131094992689858,
    "reward_max": 2.1204958227471864,
    "reward_min": 1.5394050332474594,
    "reward_std": 0.1326861716141567,
    "timesteps": 118457532,
    "learntime": 0.16137733007781208,
    "sampletime": 8.759868169901893,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 351,
    "reward_mean": 1.8199353330605734,
    "reward_max": 2.2054760273198473,
    "reward_min": 1.2895869749417084,
    "reward_std": 0.16005151612933893,
    "timesteps": 118818252,
    "learntime": 0.1564782119821757,
    "sampletime": 8.819161269813776,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 352,
    "reward_mean": 1.8225398830972686,
    "reward_max": 2.2668144215955786,
    "reward_min": 1.4478681662938342,
    "reward_std": 0.1782585155339628,
    "timesteps": 119178972,
    "learntime": 0.20271971495822072,
    "sampletime": 8.768943215953186,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 353,
    "reward_mean": 1.863780293675303,
    "reward_max": 2.182031833868343,
    "reward_min": 1.515169928041743,
    "reward_std": 0.1459660467922118,
    "timesteps": 119539692,
    "learntime": 0.17575851315632463,
    "sampletime": 8.734035288915038,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 354,
    "reward_mean": 1.460768859129559,
    "reward_max": 2.1297781497494026,
    "reward_min": -6.546874425508029,
    "reward_std": 1.6864715845776075,
    "timesteps": 119899278,
    "learntime": 0.20995529112406075,
    "sampletime": 8.729859209153801,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 355,
    "reward_mean": 1.7991446735898393,
    "reward_max": 2.111402534369984,
    "reward_min": 1.4753808298523305,
    "reward_std": 0.14342469847254036,
    "timesteps": 120259998,
    "learntime": 0.1627577890176326,
    "sampletime": 8.735848946962506,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 356,
    "reward_mean": 1.432562890034724,
    "reward_max": 2.2375709292563504,
    "reward_min": -7.537838671354681,
    "reward_std": 1.9092691708486018,
    "timesteps": 120619506,
    "learntime": 0.21341326599940658,
    "sampletime": 8.660654231905937,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 357,
    "reward_mean": 1.8472182636344505,
    "reward_max": 2.262120691382069,
    "reward_min": 1.5521279392209664,
    "reward_std": 0.13985969272946008,
    "timesteps": 120980226,
    "learntime": 0.16760911396704614,
    "sampletime": 8.842112394049764,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 358,
    "reward_mean": 1.867671946731662,
    "reward_max": 2.223668204358543,
    "reward_min": 1.3987041251349352,
    "reward_std": 0.17047680058192485,
    "timesteps": 121340946,
    "learntime": 0.21797148906625807,
    "sampletime": 8.841429342981428,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 359,
    "reward_mean": 1.8117796885648594,
    "reward_max": 2.118051007529365,
    "reward_min": 1.2011799764480753,
    "reward_std": 0.1733212618056113,
    "timesteps": 121701666,
    "learntime": 0.1606021299958229,
    "sampletime": 8.787314076907933,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 360,
    "reward_mean": 1.7813225466398137,
    "reward_max": 2.1868273950125428,
    "reward_min": 1.426183216968305,
    "reward_std": 0.16710150414436234,
    "timesteps": 122062386,
    "learntime": 0.20281730499118567,
    "sampletime": 8.712951353052631,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 361,
    "reward_mean": 1.7205680264687462,
    "reward_max": 2.1148633135140456,
    "reward_min": 1.4087178571194665,
    "reward_std": 0.15979229134771383,
    "timesteps": 122423106,
    "learntime": 0.22512134001590312,
    "sampletime": 8.750618088059127,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 362,
    "reward_mean": 1.761568760787488,
    "reward_max": 2.1228962123015194,
    "reward_min": 1.3881150805844076,
    "reward_std": 0.1603170013524562,
    "timesteps": 122783826,
    "learntime": 0.17894036206416786,
    "sampletime": 8.84150355309248,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 363,
    "reward_mean": 1.783982885959608,
    "reward_max": 2.0944738857287994,
    "reward_min": 1.3724929772204497,
    "reward_std": 0.1562841856656657,
    "timesteps": 123144546,
    "learntime": 0.2250873630400747,
    "sampletime": 8.645218137884513,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 364,
    "reward_mean": 1.8721943919443067,
    "reward_max": 2.2811363571778513,
    "reward_min": 1.4519668630616946,
    "reward_std": 0.17513372726480536,
    "timesteps": 123505266,
    "learntime": 0.17008960503153503,
    "sampletime": 8.747954217949882,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 365,
    "reward_mean": 1.9124739778739186,
    "reward_max": 2.2841357820893076,
    "reward_min": 1.5633805451533647,
    "reward_std": 0.16709931861394847,
    "timesteps": 123865986,
    "learntime": 0.21948140510357916,
    "sampletime": 8.848481226945296,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 366,
    "reward_mean": 1.904764937075857,
    "reward_max": 2.275378459669423,
    "reward_min": 1.5606271436183954,
    "reward_std": 0.14239305024362128,
    "timesteps": 124226706,
    "learntime": 0.16865764115937054,
    "sampletime": 8.688610409153625,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 367,
    "reward_mean": 1.831955293553313,
    "reward_max": 2.1669428271142674,
    "reward_min": 1.4605173592572067,
    "reward_std": 0.14707388115919484,
    "timesteps": 124587426,
    "learntime": 0.20759590482339263,
    "sampletime": 8.78344721510075,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 368,
    "reward_mean": 1.8014616605431928,
    "reward_max": 2.0834145568369418,
    "reward_min": 1.340206241248363,
    "reward_std": 0.18813422881823885,
    "timesteps": 124948146,
    "learntime": 0.17342966911382973,
    "sampletime": 8.772248854860663,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 369,
    "reward_mean": 1.829015993936765,
    "reward_max": 2.253279673223115,
    "reward_min": 1.4725564139485898,
    "reward_std": 0.15340245633667887,
    "timesteps": 125308866,
    "learntime": 0.19467290793545544,
    "sampletime": 8.711487862979993,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 370,
    "reward_mean": 1.742466448300399,
    "reward_max": 2.07425310456363,
    "reward_min": 1.4263945200170056,
    "reward_std": 0.1430987405083343,
    "timesteps": 125669586,
    "learntime": 0.16931679798290133,
    "sampletime": 8.804234714945778,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 371,
    "reward_mean": 1.8202112120888785,
    "reward_max": 2.0464983086285105,
    "reward_min": 1.444580119171982,
    "reward_std": 0.1263455716431111,
    "timesteps": 126030306,
    "learntime": 0.19530287804082036,
    "sampletime": 8.740848663961515,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 372,
    "reward_mean": 1.8804955406514279,
    "reward_max": 2.2265063483624306,
    "reward_min": 1.5432777354197391,
    "reward_std": 0.15170481476218314,
    "timesteps": 126391026,
    "learntime": 0.15596016496419907,
    "sampletime": 8.770649624988437,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 373,
    "reward_mean": 1.4520497615019785,
    "reward_max": 2.2249731711086063,
    "reward_min": -7.2321037196406115,
    "reward_std": 1.8595277893336635,
    "timesteps": 126750567,
    "learntime": 0.20970476092770696,
    "sampletime": 8.732556307921186,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 374,
    "reward_mean": 1.4134622863643789,
    "reward_max": 2.1795177422040553,
    "reward_min": -7.072545703610754,
    "reward_std": 1.8613872238868778,
    "timesteps": 127110108,
    "learntime": 0.17574233817867935,
    "sampletime": 8.85090803494677,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 375,
    "reward_mean": 1.7894630552604984,
    "reward_max": 2.096775256378651,
    "reward_min": 1.5303550423087637,
    "reward_std": 0.12659766861218472,
    "timesteps": 127470828,
    "learntime": 0.2041915690060705,
    "sampletime": 8.72758791106753,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 376,
    "reward_mean": 1.817339320426794,
    "reward_max": 2.0527990025236944,
    "reward_min": 1.30294517086374,
    "reward_std": 0.12500516332149467,
    "timesteps": 127831548,
    "learntime": 0.16974252089858055,
    "sampletime": 8.711083978880197,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 377,
    "reward_mean": 1.7928659255222397,
    "reward_max": 2.210155609391625,
    "reward_min": 1.3882844933541478,
    "reward_std": 0.18680362796681366,
    "timesteps": 128192268,
    "learntime": 0.21928984904661775,
    "sampletime": 8.814018115168437,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 378,
    "reward_mean": 1.8087402929922687,
    "reward_max": 2.160157926408119,
    "reward_min": 1.3766564018301177,
    "reward_std": 0.17268661018820083,
    "timesteps": 128552988,
    "learntime": 0.17201179405674338,
    "sampletime": 8.728279778035358,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 379,
    "reward_mean": 1.795310737386691,
    "reward_max": 2.099672156851735,
    "reward_min": 1.5318363909221542,
    "reward_std": 0.15842459565753222,
    "timesteps": 128913708,
    "learntime": 0.21443713805638254,
    "sampletime": 8.833915903000161,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 380,
    "reward_mean": 0.5760921186143915,
    "reward_max": 2.1420115424658723,
    "reward_min": -25.697340588438127,
    "reward_std": 4.225061956167033,
    "timesteps": 129270444,
    "learntime": 0.16397564904764295,
    "sampletime": 8.84400130994618,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 381,
    "reward_mean": 1.8272133505775314,
    "reward_max": 2.2972915157936784,
    "reward_min": 1.380658861524847,
    "reward_std": 0.1730384839463788,
    "timesteps": 129631164,
    "learntime": 0.15957449795678258,
    "sampletime": 8.80631135799922,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 382,
    "reward_mean": 1.8253174892548065,
    "reward_max": 2.0672414078241332,
    "reward_min": 1.5041636893266408,
    "reward_std": 0.12373428281354633,
    "timesteps": 129991884,
    "learntime": 0.16972138499841094,
    "sampletime": 8.812695391010493,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 383,
    "reward_mean": 1.8884204629897576,
    "reward_max": 2.222984033181228,
    "reward_min": 1.4577945663575027,
    "reward_std": 0.137688730964997,
    "timesteps": 130352604,
    "learntime": 0.2119514320511371,
    "sampletime": 8.699469467857853,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 384,
    "reward_mean": 1.8155887089866896,
    "reward_max": 2.1913204751062096,
    "reward_min": 1.5264147372448233,
    "reward_std": 0.15862097485944757,
    "timesteps": 130713324,
    "learntime": 0.16182135907001793,
    "sampletime": 8.813101587118581,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 385,
    "reward_mean": 1.8505899527986531,
    "reward_max": 2.219964982801517,
    "reward_min": 1.4914445318085405,
    "reward_std": 0.1911063222550624,
    "timesteps": 131074044,
    "learntime": 0.22630114504136145,
    "sampletime": 8.707763599930331,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 386,
    "reward_mean": 1.817745023420657,
    "reward_max": 2.1148028880900984,
    "reward_min": 1.475697896414202,
    "reward_std": 0.1310578231686999,
    "timesteps": 131434764,
    "learntime": 0.16683044913224876,
    "sampletime": 8.7270131430123,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 387,
    "reward_mean": 1.2901866579310322,
    "reward_max": 2.154823141408885,
    "reward_min": -7.444319704222974,
    "reward_std": 1.9287234339804007,
    "timesteps": 131794185,
    "learntime": 0.2161350690294057,
    "sampletime": 8.883194128982723,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 388,
    "reward_mean": 0.9901346376613488,
    "reward_max": 2.0777367466062304,
    "reward_min": -7.162245667765311,
    "reward_std": 2.461296937610108,
    "timesteps": 132152688,
    "learntime": 0.17084219702519476,
    "sampletime": 8.666718750959262,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 389,
    "reward_mean": 1.399726633094629,
    "reward_max": 2.085050548098284,
    "reward_min": -7.139335543044251,
    "reward_std": 1.7873507339174768,
    "timesteps": 132512577,
    "learntime": 0.22306509991176426,
    "sampletime": 8.71561346296221,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 390,
    "reward_mean": 1.4628843062091712,
    "reward_max": 2.1624927689060276,
    "reward_min": -7.006533101464978,
    "reward_std": 1.8147184098334201,
    "timesteps": 132872223,
    "learntime": 0.16119893407449126,
    "sampletime": 8.760969836032018,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 391,
    "reward_mean": 1.8563259891122976,
    "reward_max": 2.135068274631822,
    "reward_min": 1.514265266546066,
    "reward_std": 0.14298476651460157,
    "timesteps": 133232943,
    "learntime": 0.1909356729593128,
    "sampletime": 8.805588694056496,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 392,
    "reward_mean": 1.818810460320234,
    "reward_max": 2.168199707200982,
    "reward_min": 1.5612037155290357,
    "reward_std": 0.12354702452157944,
    "timesteps": 133593663,
    "learntime": 0.1618602250237018,
    "sampletime": 8.758998737903312,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 393,
    "reward_mean": 1.351150891914859,
    "reward_max": 2.151312666030004,
    "reward_min": -7.397369703623667,
    "reward_std": 1.9144639269333181,
    "timesteps": 133953120,
    "learntime": 0.21782540995627642,
    "sampletime": 8.711091668810695,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 394,
    "reward_mean": 1.7278981408484224,
    "reward_max": 2.03454694187332,
    "reward_min": 1.4072600381182485,
    "reward_std": 0.13417219054593701,
    "timesteps": 134313840,
    "learntime": 0.17027886398136616,
    "sampletime": 8.81730158184655,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 395,
    "reward_mean": 1.7342733781894748,
    "reward_max": 2.2179270292752173,
    "reward_min": 1.4150617972481974,
    "reward_std": 0.15941715881739452,
    "timesteps": 134674560,
    "learntime": 0.19558775215409696,
    "sampletime": 8.715268487809226,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 396,
    "reward_mean": 1.799284575655439,
    "reward_max": 2.186313486379124,
    "reward_min": 1.418666644208835,
    "reward_std": 0.1901726597715692,
    "timesteps": 135035280,
    "learntime": 0.16695156996138394,
    "sampletime": 8.797102917917073,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 397,
    "reward_mean": 1.845385926277884,
    "reward_max": 2.503494267680003,
    "reward_min": 1.5216491007659971,
    "reward_std": 0.16106948761639972,
    "timesteps": 135396000,
    "learntime": 0.23194913612678647,
    "sampletime": 8.750337848905474,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 398,
    "reward_mean": 1.8359221654546027,
    "reward_max": 2.2811667253245633,
    "reward_min": 1.5117641687393162,
    "reward_std": 0.141979090381927,
    "timesteps": 135756720,
    "learntime": 0.17184712807647884,
    "sampletime": 8.722159436903894,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 399,
    "reward_mean": 1.8976004309510865,
    "reward_max": 2.227894799916407,
    "reward_min": 1.4170453275843136,
    "reward_std": 0.180009940578518,
    "timesteps": 136117440,
    "learntime": 0.217557140160352,
    "sampletime": 8.852061341051012,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 400,
    "reward_mean": 0.6039479049689145,
    "reward_max": 2.1846577663187996,
    "reward_min": -7.220863086488947,
    "reward_std": 3.0333668341023103,
    "timesteps": 136474590,
    "learntime": 0.17920216801576316,
    "sampletime": 8.634831686038524,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 401,
    "reward_mean": 1.4569492069520438,
    "reward_max": 2.3655026571003765,
    "reward_min": -7.226999125141006,
    "reward_std": 1.8661270756052515,
    "timesteps": 136834125,
    "learntime": 0.17730465019121766,
    "sampletime": 8.640101623022929,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 402,
    "reward_mean": 1.8112371043199043,
    "reward_max": 2.186609824935931,
    "reward_min": 1.4814069851418001,
    "reward_std": 0.14386399072444966,
    "timesteps": 137194845,
    "learntime": 0.16898612794466317,
    "sampletime": 8.589830992044881,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 403,
    "reward_mean": 1.7851193831647492,
    "reward_max": 2.146158099834183,
    "reward_min": 1.1871136552786479,
    "reward_std": 0.19180213681814148,
    "timesteps": 137555565,
    "learntime": 0.22114305500872433,
    "sampletime": 8.523356294026598,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 404,
    "reward_mean": 1.8296954496689328,
    "reward_max": 2.1863517035504376,
    "reward_min": 1.4520093103346865,
    "reward_std": 0.16436927775758645,
    "timesteps": 137916285,
    "learntime": 0.16664596903137863,
    "sampletime": 8.560375627828762,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 405,
    "reward_mean": 1.833768386744198,
    "reward_max": 2.202308571523503,
    "reward_min": 1.4974904477412816,
    "reward_std": 0.14116386638053943,
    "timesteps": 138277005,
    "learntime": 0.21211925707757473,
    "sampletime": 8.684806395089254,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 406,
    "reward_mean": 1.769923799992175,
    "reward_max": 2.131799937312987,
    "reward_min": 1.3857527296188161,
    "reward_std": 0.15804170316221208,
    "timesteps": 138637725,
    "learntime": 0.16354934009723365,
    "sampletime": 8.62393790204078,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 407,
    "reward_mean": 1.7808277319661578,
    "reward_max": 2.2032930035017064,
    "reward_min": 1.4415817195831808,
    "reward_std": 0.1604843948974403,
    "timesteps": 138998445,
    "learntime": 0.22137510916218162,
    "sampletime": 8.69478633417748,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 408,
    "reward_mean": 1.8061779978569912,
    "reward_max": 2.0319503160902603,
    "reward_min": 1.4552500954243528,
    "reward_std": 0.1274217298485902,
    "timesteps": 139359165,
    "learntime": 0.16663562785834074,
    "sampletime": 8.704171352088451,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 409,
    "reward_mean": 1.8443220101768767,
    "reward_max": 2.321797462963411,
    "reward_min": 1.3026377744514082,
    "reward_std": 0.17958246670992045,
    "timesteps": 139719885,
    "learntime": 0.2324876671191305,
    "sampletime": 8.667817052919418,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 410,
    "reward_mean": 1.7783507824086322,
    "reward_max": 2.162396350246676,
    "reward_min": 1.342738101717479,
    "reward_std": 0.16298572763622962,
    "timesteps": 140080605,
    "learntime": 0.17652354785241187,
    "sampletime": 8.785701069049537,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 411,
    "reward_mean": 1.844786610551032,
    "reward_max": 2.11925219884054,
    "reward_min": 1.3281840081044414,
    "reward_std": 0.17130233362883704,
    "timesteps": 140441325,
    "learntime": 0.21678240597248077,
    "sampletime": 8.783636354841292,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 412,
    "reward_mean": 1.3605384720551414,
    "reward_max": 2.113259537766376,
    "reward_min": -7.194423373619269,
    "reward_std": 1.882793236630979,
    "timesteps": 140801082,
    "learntime": 0.17774293781258166,
    "sampletime": 8.694824066013098,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 413,
    "reward_mean": 1.8186628495104993,
    "reward_max": 2.16432591166019,
    "reward_min": 1.4945902705173137,
    "reward_std": 0.16519169235544146,
    "timesteps": 141161802,
    "learntime": 0.20278609404340386,
    "sampletime": 8.732658734777942,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 414,
    "reward_mean": 1.7893433971832424,
    "reward_max": 2.0005592852698566,
    "reward_min": 1.4232279841759867,
    "reward_std": 0.1349772813308206,
    "timesteps": 141522522,
    "learntime": 0.17092473478987813,
    "sampletime": 8.770934151951224,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 415,
    "reward_mean": 1.8794174970422044,
    "reward_max": 2.240897806999837,
    "reward_min": 1.405550670192687,
    "reward_std": 0.1712357581903108,
    "timesteps": 141883242,
    "learntime": 0.16524025308899581,
    "sampletime": 8.919515087036416,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 416,
    "reward_mean": 1.829463751811387,
    "reward_max": 2.110420332196303,
    "reward_min": 1.6249072480325877,
    "reward_std": 0.11198767591508955,
    "timesteps": 142243962,
    "learntime": 0.16658917698077857,
    "sampletime": 8.87894659396261,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 417,
    "reward_mean": 1.7962556701749188,
    "reward_max": 2.172931763672647,
    "reward_min": 1.434155738025294,
    "reward_std": 0.13010916091813327,
    "timesteps": 142604682,
    "learntime": 0.1639527529478073,
    "sampletime": 8.75202156510204,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 418,
    "reward_mean": 1.7410151737650987,
    "reward_max": 2.1214882158198036,
    "reward_min": 1.4253891136278511,
    "reward_std": 0.15080946882227947,
    "timesteps": 142965402,
    "learntime": 0.16089200088754296,
    "sampletime": 8.662834236864,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 419,
    "reward_mean": 1.782528821442911,
    "reward_max": 2.021089863391047,
    "reward_min": 1.4612007014396946,
    "reward_std": 0.13146907775160047,
    "timesteps": 143326122,
    "learntime": 0.16646862984634936,
    "sampletime": 8.762555293971673,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 420,
    "reward_mean": 1.8277187444348626,
    "reward_max": 2.147830317918716,
    "reward_min": 1.508613766502642,
    "reward_std": 0.1506560240321213,
    "timesteps": 143686842,
    "learntime": 0.1646898069884628,
    "sampletime": 8.790009588003159,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 421,
    "reward_mean": 1.755006543429956,
    "reward_max": 2.1236291232203106,
    "reward_min": 1.4419820679027109,
    "reward_std": 0.1483857005991002,
    "timesteps": 144047562,
    "learntime": 0.1648139301687479,
    "sampletime": 8.661266586044803,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 422,
    "reward_mean": 1.8624645588332025,
    "reward_max": 2.222539048382631,
    "reward_min": 1.533981579017231,
    "reward_std": 0.15110213003847117,
    "timesteps": 144408282,
    "learntime": 0.16734644793905318,
    "sampletime": 8.633513235952705,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 423,
    "reward_mean": 1.847177751256784,
    "reward_max": 2.2157677466395467,
    "reward_min": 1.522253973721736,
    "reward_std": 0.15513008288181387,
    "timesteps": 144769002,
    "learntime": 0.16933607612736523,
    "sampletime": 8.809364314889535,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 424,
    "reward_mean": 1.7762755110146613,
    "reward_max": 2.2386156987243613,
    "reward_min": 1.2049577680264691,
    "reward_std": 0.18978704898351223,
    "timesteps": 145129722,
    "learntime": 0.16871297406032681,
    "sampletime": 8.7497564710211,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 425,
    "reward_mean": 1.8555408224517724,
    "reward_max": 2.181295016777259,
    "reward_min": 1.4694875556775076,
    "reward_std": 0.16808803189254456,
    "timesteps": 145490442,
    "learntime": 0.16399450809694827,
    "sampletime": 8.735508639132604,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 426,
    "reward_mean": 1.8521250227000987,
    "reward_max": 2.1571240183777367,
    "reward_min": 1.5131672935165192,
    "reward_std": 0.14645033056229811,
    "timesteps": 145851162,
    "learntime": 0.17025130498223007,
    "sampletime": 8.695208193035796,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 427,
    "reward_mean": 1.866130123109964,
    "reward_max": 2.302741811233288,
    "reward_min": 1.5535513500993432,
    "reward_std": 0.15725985092867498,
    "timesteps": 146211882,
    "learntime": 0.1749550038948655,
    "sampletime": 8.762592500075698,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 428,
    "reward_mean": 1.7971112041038593,
    "reward_max": 2.142255315498471,
    "reward_min": 1.4403002434733507,
    "reward_std": 0.1549753277790252,
    "timesteps": 146572602,
    "learntime": 0.1647357300389558,
    "sampletime": 8.738606922794133,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 429,
    "reward_mean": 1.8497783876690206,
    "reward_max": 2.226837525800375,
    "reward_min": 1.5750543901101766,
    "reward_std": 0.16390517884492545,
    "timesteps": 146933322,
    "learntime": 0.17264847713522613,
    "sampletime": 8.666494393954054,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 430,
    "reward_mean": 1.872093041626593,
    "reward_max": 2.317426286483442,
    "reward_min": 1.5571822957682515,
    "reward_std": 0.15281290330728933,
    "timesteps": 147294042,
    "learntime": 0.17673823190853,
    "sampletime": 8.70718118804507,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 431,
    "reward_mean": 1.8289397245132808,
    "reward_max": 2.205286923078042,
    "reward_min": 1.5010370251468623,
    "reward_std": 0.16051899628308264,
    "timesteps": 147654762,
    "learntime": 0.15810711402446032,
    "sampletime": 8.730247049825266,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 432,
    "reward_mean": 1.8711866384404585,
    "reward_max": 2.2510371413566923,
    "reward_min": 1.4369284561072333,
    "reward_std": 0.1732600866093032,
    "timesteps": 148015482,
    "learntime": 0.1637433839496225,
    "sampletime": 8.809035506099463,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 433,
    "reward_mean": 1.7867094775281818,
    "reward_max": 2.1785092632120926,
    "reward_min": 1.476760571427416,
    "reward_std": 0.14683615777311934,
    "timesteps": 148376202,
    "learntime": 0.16852485784329474,
    "sampletime": 8.890860548010096,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 434,
    "reward_mean": 1.8261964776135855,
    "reward_max": 2.3477151255744193,
    "reward_min": 1.5279115713624778,
    "reward_std": 0.1589688097384529,
    "timesteps": 148736922,
    "learntime": 0.173679563915357,
    "sampletime": 8.69356449181214,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 435,
    "reward_mean": 1.7653748198524202,
    "reward_max": 2.165909728630341,
    "reward_min": 1.3950616341352335,
    "reward_std": 0.15410109357423996,
    "timesteps": 149097642,
    "learntime": 0.17269088397733867,
    "sampletime": 8.719076342880726,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 436,
    "reward_mean": 1.7881861486271549,
    "reward_max": 2.2509345725411523,
    "reward_min": 1.2331937866878078,
    "reward_std": 0.1956785056236981,
    "timesteps": 149458362,
    "learntime": 0.17155513097532094,
    "sampletime": 8.818192754872143,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 437,
    "reward_mean": 1.8113454364828763,
    "reward_max": 2.174659888695004,
    "reward_min": 1.2666922276539732,
    "reward_std": 0.170456147351529,
    "timesteps": 149819082,
    "learntime": 0.17365645803511143,
    "sampletime": 8.770493020070717,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 438,
    "reward_mean": 1.4131405091184137,
    "reward_max": 2.0814164894364864,
    "reward_min": -7.285266829319441,
    "reward_std": 1.870810368185366,
    "timesteps": 150178593,
    "learntime": 0.16994330193847418,
    "sampletime": 8.731889319140464,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 439,
    "reward_mean": 1.8929549441947116,
    "reward_max": 2.2626836302968267,
    "reward_min": 1.6027226767247242,
    "reward_std": 0.1399468920275531,
    "timesteps": 150539313,
    "learntime": 0.16984653007239103,
    "sampletime": 8.61987942783162,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 440,
    "reward_mean": 1.9020006724201481,
    "reward_max": 2.3753767007799578,
    "reward_min": 1.3194026875681812,
    "reward_std": 0.19048425488368328,
    "timesteps": 150900033,
    "learntime": 0.18130766414105892,
    "sampletime": 8.80840286705643,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 441,
    "reward_mean": 1.4849950008037602,
    "reward_max": 2.2187254432808685,
    "reward_min": -7.280568367891567,
    "reward_std": 1.9244100142020857,
    "timesteps": 151259604,
    "learntime": 0.16785241314209998,
    "sampletime": 8.74254954396747,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 442,
    "reward_mean": 1.8501454952949046,
    "reward_max": 2.2556150463466147,
    "reward_min": 1.3105344706952242,
    "reward_std": 0.17749088998049148,
    "timesteps": 151620324,
    "learntime": 0.17944832099601626,
    "sampletime": 8.806379484012723,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 443,
    "reward_mean": 1.864146881946933,
    "reward_max": 2.082124603503013,
    "reward_min": 1.447587755662176,
    "reward_std": 0.14072331848952688,
    "timesteps": 151981044,
    "learntime": 0.16890698205679655,
    "sampletime": 8.707549911923707,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 444,
    "reward_mean": 1.8423409959054475,
    "reward_max": 2.212582454985361,
    "reward_min": 1.386766776170007,
    "reward_std": 0.16530683631441592,
    "timesteps": 152341764,
    "learntime": 0.16606171685270965,
    "sampletime": 8.641173586947843,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 445,
    "reward_mean": 1.790307146459083,
    "reward_max": 2.076829809029619,
    "reward_min": 1.3682772789810143,
    "reward_std": 0.1644801626298901,
    "timesteps": 152702484,
    "learntime": 0.17408011388033628,
    "sampletime": 8.843464984092861,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 446,
    "reward_mean": 1.781567138599293,
    "reward_max": 2.114509806947103,
    "reward_min": 1.308658814361972,
    "reward_std": 0.16320672973994313,
    "timesteps": 153063204,
    "learntime": 0.17227549012750387,
    "sampletime": 8.73781365621835,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 447,
    "reward_mean": 1.810226477178977,
    "reward_max": 2.178045743829427,
    "reward_min": 1.3721027796577348,
    "reward_std": 0.16083716801489392,
    "timesteps": 153423924,
    "learntime": 0.18555645504966378,
    "sampletime": 8.716636058874428,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 448,
    "reward_mean": 1.022491491262127,
    "reward_max": 2.166695783421648,
    "reward_min": -7.033135375325485,
    "reward_std": 2.535706360021324,
    "timesteps": 153782982,
    "learntime": 0.1679472280666232,
    "sampletime": 8.720434563001618,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 449,
    "reward_mean": 1.910742350295823,
    "reward_max": 2.212636674995968,
    "reward_min": 1.530971326489328,
    "reward_std": 0.1591152284843806,
    "timesteps": 154143702,
    "learntime": 0.1667614399921149,
    "sampletime": 8.699967582011595,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 450,
    "reward_mean": 1.8662084873973113,
    "reward_max": 2.2434981084661536,
    "reward_min": 1.574975491051601,
    "reward_std": 0.15669697689675485,
    "timesteps": 154504422,
    "learntime": 0.17194460914470255,
    "sampletime": 8.796318539883941,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 451,
    "reward_mean": 1.8329230728041779,
    "reward_max": 2.088168111225856,
    "reward_min": 1.381697573632027,
    "reward_std": 0.15107439383509186,
    "timesteps": 154865142,
    "learntime": 0.16826434317044914,
    "sampletime": 8.564095067093149,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 452,
    "reward_mean": 1.7852983360329882,
    "reward_max": 2.201495363964399,
    "reward_min": 1.4630836253539472,
    "reward_std": 0.13261291797244348,
    "timesteps": 155225862,
    "learntime": 0.1685878320131451,
    "sampletime": 8.682539698900655,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 453,
    "reward_mean": 1.9176999853449979,
    "reward_max": 2.3329601526387327,
    "reward_min": 1.500720221595129,
    "reward_std": 0.1560944087253897,
    "timesteps": 155586582,
    "learntime": 0.17027287813834846,
    "sampletime": 8.753126295981929,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 454,
    "reward_mean": 1.806913260779437,
    "reward_max": 2.2671307257595306,
    "reward_min": 1.4146398764516361,
    "reward_std": 0.15842235636089386,
    "timesteps": 155947302,
    "learntime": 0.16637853905558586,
    "sampletime": 8.67251784610562,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 455,
    "reward_mean": 1.4592896592256541,
    "reward_max": 2.0969431459706134,
    "reward_min": -6.507071532978446,
    "reward_std": 1.7079880427328924,
    "timesteps": 156306945,
    "learntime": 0.16779437894001603,
    "sampletime": 8.67249473114498,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 456,
    "reward_mean": 1.476124101622628,
    "reward_max": 2.387127041809654,
    "reward_min": -7.269642911305493,
    "reward_std": 1.852821147718437,
    "timesteps": 156666588,
    "learntime": 0.17117068287916481,
    "sampletime": 8.505486287875101,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 457,
    "reward_mean": 1.8431520182958512,
    "reward_max": 2.2010795193491477,
    "reward_min": 1.574708013329652,
    "reward_std": 0.12788731112614368,
    "timesteps": 157027308,
    "learntime": 0.16151542984880507,
    "sampletime": 8.664065137971193,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 458,
    "reward_mean": 1.749632339448731,
    "reward_max": 2.1635510990921745,
    "reward_min": 1.4244045558708316,
    "reward_std": 0.16741876218039364,
    "timesteps": 157388028,
    "learntime": 0.1902259278576821,
    "sampletime": 8.73340766900219,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 459,
    "reward_mean": 1.7428420730429925,
    "reward_max": 2.050616254684315,
    "reward_min": 1.433953411531434,
    "reward_std": 0.1474344573658999,
    "timesteps": 157748748,
    "learntime": 0.20081128389574587,
    "sampletime": 8.850378442090005,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 460,
    "reward_mean": 1.7896104905219028,
    "reward_max": 2.111802679428805,
    "reward_min": 1.4607581941368546,
    "reward_std": 0.13276236387063706,
    "timesteps": 158109468,
    "learntime": 0.16919730487279594,
    "sampletime": 8.743230564054102,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 461,
    "reward_mean": 1.4097021197821433,
    "reward_max": 2.1056022373368504,
    "reward_min": -7.503513376637731,
    "reward_std": 1.9127744819166772,
    "timesteps": 158468988,
    "learntime": 0.21439070999622345,
    "sampletime": 8.919841998023912,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 462,
    "reward_mean": 1.778207541638975,
    "reward_max": 2.1376220862430517,
    "reward_min": 1.498562401446342,
    "reward_std": 0.1397409378577121,
    "timesteps": 158829708,
    "learntime": 0.21181171503849328,
    "sampletime": 8.612094945041463,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 463,
    "reward_mean": 1.8188944253771548,
    "reward_max": 2.1859164626882586,
    "reward_min": 1.2764960576243898,
    "reward_std": 0.16235409315222102,
    "timesteps": 159190428,
    "learntime": 0.17879757191985846,
    "sampletime": 8.741591935046017,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 464,
    "reward_mean": 1.8275005535324242,
    "reward_max": 2.2510932245527813,
    "reward_min": 1.4414694875471663,
    "reward_std": 0.17832275942769216,
    "timesteps": 159551148,
    "learntime": 0.22697005583904684,
    "sampletime": 8.856296255951747,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 465,
    "reward_mean": 1.3667356814374885,
    "reward_max": 2.2085381346979456,
    "reward_min": -15.903266705064611,
    "reward_std": 2.3970690602836187,
    "timesteps": 159910911,
    "learntime": 0.16695998888462782,
    "sampletime": 8.701088650152087,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 466,
    "reward_mean": 1.8168252235084017,
    "reward_max": 2.13625103998823,
    "reward_min": 1.4140107380790679,
    "reward_std": 0.12599998633219522,
    "timesteps": 160271631,
    "learntime": 0.23150730109773576,
    "sampletime": 8.96974998083897,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 467,
    "reward_mean": 1.7955566990722156,
    "reward_max": 2.109736104252407,
    "reward_min": 1.5434424369284665,
    "reward_std": 0.1368372733184981,
    "timesteps": 160632351,
    "learntime": 0.17560757813043892,
    "sampletime": 8.726537087000906,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 468,
    "reward_mean": 1.8293504842551378,
    "reward_max": 2.10118275741878,
    "reward_min": 1.544750219493198,
    "reward_std": 0.13719382710833938,
    "timesteps": 160993071,
    "learntime": 0.23474050499498844,
    "sampletime": 8.831426067976281,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 469,
    "reward_mean": 1.8778770609380238,
    "reward_max": 2.3162890974181747,
    "reward_min": 1.623021091822725,
    "reward_std": 0.1498032398769382,
    "timesteps": 161353791,
    "learntime": 0.1701372591778636,
    "sampletime": 8.890666929073632,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 470,
    "reward_mean": 1.4016746155533955,
    "reward_max": 2.104175203436169,
    "reward_min": -7.473362346154653,
    "reward_std": 1.873024801088861,
    "timesteps": 161713206,
    "learntime": 0.22111701592803001,
    "sampletime": 8.682390681002289,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 471,
    "reward_mean": 1.782512046509003,
    "reward_max": 2.110082622303292,
    "reward_min": 1.4295693035519668,
    "reward_std": 0.14038393326305404,
    "timesteps": 162073926,
    "learntime": 0.1751333058346063,
    "sampletime": 8.696104569127783,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 472,
    "reward_mean": 1.8520899521489977,
    "reward_max": 2.2463380673976943,
    "reward_min": 1.4995180649778097,
    "reward_std": 0.14833830128109535,
    "timesteps": 162434646,
    "learntime": 0.21563770109787583,
    "sampletime": 8.77022772305645,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 473,
    "reward_mean": 1.401428019675265,
    "reward_max": 2.203326963789546,
    "reward_min": -7.223873628966623,
    "reward_std": 1.8146264335642541,
    "timesteps": 162794283,
    "learntime": 0.18605570797808468,
    "sampletime": 8.830448266118765,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 474,
    "reward_mean": 1.8250116830621081,
    "reward_max": 2.233803696535888,
    "reward_min": 1.4864779343751577,
    "reward_std": 0.14055470933200367,
    "timesteps": 163155003,
    "learntime": 0.2313830649945885,
    "sampletime": 8.77417890005745,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 475,
    "reward_mean": 1.85322679508341,
    "reward_max": 2.121467697545248,
    "reward_min": 1.4528382957285013,
    "reward_std": 0.147042080301814,
    "timesteps": 163515723,
    "learntime": 0.16274853493086994,
    "sampletime": 8.697277930099517,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 476,
    "reward_mean": 1.9211431174990588,
    "reward_max": 2.2423829510161215,
    "reward_min": 1.5954464781812419,
    "reward_std": 0.15358195971210511,
    "timesteps": 163876443,
    "learntime": 0.19747875910252333,
    "sampletime": 8.708078525960445,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 477,
    "reward_mean": 1.8696755680294357,
    "reward_max": 2.286012944377335,
    "reward_min": 1.5007142786776184,
    "reward_std": 0.16694269800381908,
    "timesteps": 164237163,
    "learntime": 0.1733661349862814,
    "sampletime": 8.728887737030163,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 478,
    "reward_mean": 1.8281700456012497,
    "reward_max": 2.210022566976309,
    "reward_min": 1.4159469675579712,
    "reward_std": 0.1558844893687174,
    "timesteps": 164597883,
    "learntime": 0.22029344690963626,
    "sampletime": 8.823326873825863,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 479,
    "reward_mean": 1.810080919247025,
    "reward_max": 2.227132198155029,
    "reward_min": 1.4872394617308244,
    "reward_std": 0.15340233483598065,
    "timesteps": 164958603,
    "learntime": 0.17541379085741937,
    "sampletime": 8.74231605278328,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 480,
    "reward_mean": 1.8511791737161771,
    "reward_max": 2.290092264309128,
    "reward_min": 1.475635596829102,
    "reward_std": 0.14201549119920023,
    "timesteps": 165319323,
    "learntime": 0.21436378499493003,
    "sampletime": 8.772457068087533,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 481,
    "reward_mean": 1.8280128215431666,
    "reward_max": 2.1808516951701162,
    "reward_min": 1.4684517388639913,
    "reward_std": 0.152729713338867,
    "timesteps": 165680043,
    "learntime": 0.1718829469755292,
    "sampletime": 8.719450935022905,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 482,
    "reward_mean": 1.8843841867893,
    "reward_max": 2.1670886905786637,
    "reward_min": 1.6544579121885652,
    "reward_std": 0.11457614541889387,
    "timesteps": 166040763,
    "learntime": 0.20448394096456468,
    "sampletime": 8.794986818917096,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 483,
    "reward_mean": 1.7978700031003254,
    "reward_max": 2.1748136166865533,
    "reward_min": 1.3546638840590735,
    "reward_std": 0.15752044448569064,
    "timesteps": 166401483,
    "learntime": 0.1743646669201553,
    "sampletime": 8.846852086950094,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 484,
    "reward_mean": 1.7570654181795993,
    "reward_max": 2.13420245845301,
    "reward_min": 1.4691390946981917,
    "reward_std": 0.1420261557847097,
    "timesteps": 166762203,
    "learntime": 0.2268924207892269,
    "sampletime": 8.831763641908765,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 485,
    "reward_mean": 1.8488415417684907,
    "reward_max": 2.301179449939145,
    "reward_min": 1.3695862981857658,
    "reward_std": 0.19247410409665436,
    "timesteps": 167122923,
    "learntime": 0.16692410106770694,
    "sampletime": 8.72636600304395,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 486,
    "reward_mean": 1.7868766193703878,
    "reward_max": 2.069314354320843,
    "reward_min": 1.4561059711588415,
    "reward_std": 0.15283999752122454,
    "timesteps": 167483643,
    "learntime": 0.23193060513585806,
    "sampletime": 8.826759319053963,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 487,
    "reward_mean": 1.8164716932284304,
    "reward_max": 2.3001071137171487,
    "reward_min": 1.4376345995697168,
    "reward_std": 0.17539414836581146,
    "timesteps": 167844363,
    "learntime": 0.17419117991812527,
    "sampletime": 8.844866888830438,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 488,
    "reward_mean": 1.8668974017899107,
    "reward_max": 2.1360869117973693,
    "reward_min": 1.5700874266807303,
    "reward_std": 0.1404919088027862,
    "timesteps": 168205083,
    "learntime": 0.21665384387597442,
    "sampletime": 8.843105875886977,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 489,
    "reward_mean": 1.8021289093602748,
    "reward_max": 2.1223643366313545,
    "reward_min": 1.4137340645062368,
    "reward_std": 0.15778417611764836,
    "timesteps": 168565803,
    "learntime": 0.1758313230238855,
    "sampletime": 8.691919025033712,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 490,
    "reward_mean": 1.7803308604972592,
    "reward_max": 2.13441148689228,
    "reward_min": 1.2084462635684732,
    "reward_std": 0.15277105029984825,
    "timesteps": 168926523,
    "learntime": 0.2199495870154351,
    "sampletime": 8.866000152891502,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 491,
    "reward_mean": 1.7977632417432763,
    "reward_max": 2.2046117741388787,
    "reward_min": 1.443112694000414,
    "reward_std": 0.15308476184142067,
    "timesteps": 169287243,
    "learntime": 0.1735603588167578,
    "sampletime": 8.736757420003414,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 492,
    "reward_mean": 1.817590240614813,
    "reward_max": 2.2663486189364117,
    "reward_min": 1.5271812274182166,
    "reward_std": 0.1658006706442021,
    "timesteps": 169647963,
    "learntime": 0.22195465886034071,
    "sampletime": 8.62614165386185,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 493,
    "reward_mean": 1.7647961530967726,
    "reward_max": 2.162299499889326,
    "reward_min": 1.5208176929648296,
    "reward_std": 0.15567163600947273,
    "timesteps": 170008683,
    "learntime": 0.17019348894245923,
    "sampletime": 8.610182008007541,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 494,
    "reward_mean": 1.8721326383080117,
    "reward_max": 2.333666788759836,
    "reward_min": 1.2960885731606828,
    "reward_std": 0.18390536132436514,
    "timesteps": 170369403,
    "learntime": 0.2366004129871726,
    "sampletime": 8.707741297082976,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 495,
    "reward_mean": 1.8618201011941369,
    "reward_max": 2.289849747277469,
    "reward_min": 1.4973166779840723,
    "reward_std": 0.1692365710698551,
    "timesteps": 170730123,
    "learntime": 0.17735503893345594,
    "sampletime": 8.699799956055358,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 496,
    "reward_mean": 1.8085360566963322,
    "reward_max": 2.1079808090086725,
    "reward_min": 1.321306196500008,
    "reward_std": 0.1838485315835729,
    "timesteps": 171090843,
    "learntime": 0.2368561050388962,
    "sampletime": 8.73357977415435,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 497,
    "reward_mean": 1.8699657573504873,
    "reward_max": 2.153585511399076,
    "reward_min": 1.4666471201785334,
    "reward_std": 0.1361496973740807,
    "timesteps": 171451563,
    "learntime": 0.17600010219030082,
    "sampletime": 8.742618567077443,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 498,
    "reward_mean": 1.4178875171065197,
    "reward_max": 2.2136277307149443,
    "reward_min": -7.993118378354918,
    "reward_std": 1.9751612449133702,
    "timesteps": 171811230,
    "learntime": 0.23374680196866393,
    "sampletime": 8.66122583206743,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 499,
    "reward_mean": 1.0178577964429576,
    "reward_max": 2.306407309218128,
    "reward_min": -7.698079907582286,
    "reward_std": 2.6135581155783045,
    "timesteps": 172169844,
    "learntime": 0.16959836706519127,
    "sampletime": 8.750472897198051,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 500,
    "reward_mean": 1.3196729052939071,
    "reward_max": 2.0734628964547097,
    "reward_min": -8.087060807449182,
    "reward_std": 2.025332949636949,
    "timesteps": 172529511,
    "learntime": 0.21843864885158837,
    "sampletime": 8.755217019002885,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 501,
    "reward_mean": 1.8818471483296513,
    "reward_max": 2.2343020341200304,
    "reward_min": 1.5218421292374822,
    "reward_std": 0.17385927658413178,
    "timesteps": 172890231,
    "learntime": 0.16742507298476994,
    "sampletime": 8.759665908990428,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 502,
    "reward_mean": 1.8240125569797303,
    "reward_max": 2.0798442504425156,
    "reward_min": 1.5555511592661537,
    "reward_std": 0.11847445159325345,
    "timesteps": 173250951,
    "learntime": 0.226243007928133,
    "sampletime": 8.78707693121396,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 503,
    "reward_mean": 1.806364002424136,
    "reward_max": 2.2294811586422507,
    "reward_min": 1.4437104402415082,
    "reward_std": 0.14247364255918943,
    "timesteps": 173611671,
    "learntime": 0.16953636705875397,
    "sampletime": 8.692966349190101,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 504,
    "reward_mean": 1.8038551053363676,
    "reward_max": 2.1861020065173764,
    "reward_min": 1.4265758041504075,
    "reward_std": 0.16391464363503655,
    "timesteps": 173972391,
    "learntime": 0.22101965406909585,
    "sampletime": 8.81982087297365,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 505,
    "reward_mean": 1.7997741936959284,
    "reward_max": 1.9847528272393062,
    "reward_min": 1.4034213740075423,
    "reward_std": 0.12715749430752835,
    "timesteps": 174333111,
    "learntime": 0.17830813792534173,
    "sampletime": 8.83647322608158,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 506,
    "reward_mean": 1.8451063008846342,
    "reward_max": 2.2372338625992216,
    "reward_min": 1.5263290163200098,
    "reward_std": 0.1441513564456978,
    "timesteps": 174693831,
    "learntime": 0.2229365180246532,
    "sampletime": 8.767192161874846,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 507,
    "reward_mean": 1.8485748800411614,
    "reward_max": 2.186918554709388,
    "reward_min": 1.4927486772684242,
    "reward_std": 0.149076682257431,
    "timesteps": 175054551,
    "learntime": 0.1807197469752282,
    "sampletime": 8.691318314056844,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 508,
    "reward_mean": 1.747396216201353,
    "reward_max": 2.1234326597283744,
    "reward_min": 1.4498371344860468,
    "reward_std": 0.13037661722275917,
    "timesteps": 175415271,
    "learntime": 0.21330865612253547,
    "sampletime": 8.729747000150383,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 509,
    "reward_mean": 1.7972126026485074,
    "reward_max": 2.2684678806161327,
    "reward_min": 1.3888272711880143,
    "reward_std": 0.1660197284755515,
    "timesteps": 175775991,
    "learntime": 0.18100956198759377,
    "sampletime": 8.96511246683076,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 510,
    "reward_mean": 1.76935713293978,
    "reward_max": 2.2026202888695416,
    "reward_min": 1.4460011590792499,
    "reward_std": 0.12987037182792205,
    "timesteps": 176136711,
    "learntime": 0.23048901185393333,
    "sampletime": 8.761002819985151,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 511,
    "reward_mean": 1.7743896898016598,
    "reward_max": 2.1530705094161044,
    "reward_min": 1.2907435277752042,
    "reward_std": 0.15439068470373388,
    "timesteps": 176497431,
    "learntime": 0.17361685307696462,
    "sampletime": 8.717220494989306,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 512,
    "reward_mean": 1.350377883111375,
    "reward_max": 2.0699954428780583,
    "reward_min": -7.011352470172853,
    "reward_std": 1.7858881462330893,
    "timesteps": 176857173,
    "learntime": 0.20629059500060976,
    "sampletime": 8.860837289132178,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 513,
    "reward_mean": 1.7586957592185377,
    "reward_max": 2.2445867663834966,
    "reward_min": 1.2841735158934047,
    "reward_std": 0.1693027405478468,
    "timesteps": 177217893,
    "learntime": 0.1654432830400765,
    "sampletime": 8.785108643118292,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 514,
    "reward_mean": 1.8335661916262767,
    "reward_max": 2.1245368173642216,
    "reward_min": 1.4721927256186682,
    "reward_std": 0.13806126269470118,
    "timesteps": 177578613,
    "learntime": 0.2054113489575684,
    "sampletime": 8.901235659141093,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 515,
    "reward_mean": 1.817045917725433,
    "reward_max": 2.2140929346981744,
    "reward_min": 1.4498941650321757,
    "reward_std": 0.16066389045708074,
    "timesteps": 177939333,
    "learntime": 0.17454051808454096,
    "sampletime": 8.731255772989243,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 516,
    "reward_mean": 1.7957562863631984,
    "reward_max": 2.153690760440164,
    "reward_min": 1.4016762540435788,
    "reward_std": 0.13819279458370826,
    "timesteps": 178300053,
    "learntime": 0.2246279870159924,
    "sampletime": 8.71456881891936,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 517,
    "reward_mean": 1.8677505033022619,
    "reward_max": 2.263257668056403,
    "reward_min": 1.3831131750775947,
    "reward_std": 0.13937999608598217,
    "timesteps": 178660773,
    "learntime": 0.17885285103693604,
    "sampletime": 8.7251669568941,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 518,
    "reward_mean": 1.8439516761578285,
    "reward_max": 2.180724747913901,
    "reward_min": 1.513145460923566,
    "reward_std": 0.1444145230197212,
    "timesteps": 179021493,
    "learntime": 0.2116480169352144,
    "sampletime": 8.804325981996953,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 519,
    "reward_mean": 1.866554931397211,
    "reward_max": 2.097604609621953,
    "reward_min": 1.560181332278361,
    "reward_std": 0.12102622170460198,
    "timesteps": 179382213,
    "learntime": 0.16257442999631166,
    "sampletime": 8.905220472952351,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 520,
    "reward_mean": 1.36227056996729,
    "reward_max": 2.090805250047937,
    "reward_min": -7.162186907099872,
    "reward_std": 1.8726630717490313,
    "timesteps": 179741799,
    "learntime": 0.21722809202037752,
    "sampletime": 8.786193053005263,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 521,
    "reward_mean": 1.799478004051339,
    "reward_max": 2.1413932506129054,
    "reward_min": 1.4782635513546543,
    "reward_std": 0.1586454802284001,
    "timesteps": 180102519,
    "learntime": 0.17507027206011117,
    "sampletime": 8.767817146144807,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 522,
    "reward_mean": 1.7639351053491896,
    "reward_max": 2.0603855711788923,
    "reward_min": 1.2489570835540555,
    "reward_std": 0.15853145874859428,
    "timesteps": 180463239,
    "learntime": 0.22372248605825007,
    "sampletime": 8.844889085972682,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 523,
    "reward_mean": 1.4171179814337918,
    "reward_max": 2.283672785481691,
    "reward_min": -7.2628535076827685,
    "reward_std": 1.8491079711651457,
    "timesteps": 180822714,
    "learntime": 0.17236937303096056,
    "sampletime": 8.633763992926106,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 524,
    "reward_mean": 1.407888726781409,
    "reward_max": 2.322820790965729,
    "reward_min": -6.979638167388853,
    "reward_std": 1.849742253987321,
    "timesteps": 181182258,
    "learntime": 0.23257992300204933,
    "sampletime": 8.66676486004144,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 525,
    "reward_mean": 1.8130337455192538,
    "reward_max": 2.062382125232197,
    "reward_min": 1.4456149966272518,
    "reward_std": 0.13544212227272134,
    "timesteps": 181542978,
    "learntime": 0.17122216895222664,
    "sampletime": 8.822886628098786,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 526,
    "reward_mean": 1.8229119874649249,
    "reward_max": 2.3072138941563662,
    "reward_min": 1.3654366164555514,
    "reward_std": 0.1567497902201478,
    "timesteps": 181903698,
    "learntime": 0.17638950305990875,
    "sampletime": 8.947983840946108,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 527,
    "reward_mean": 1.8261380693489255,
    "reward_max": 2.156739577643967,
    "reward_min": 1.4903089284251259,
    "reward_std": 0.1461981379040883,
    "timesteps": 182264418,
    "learntime": 0.19122701906599104,
    "sampletime": 8.874077760148793,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 528,
    "reward_mean": 1.8708496205744685,
    "reward_max": 2.222177024347753,
    "reward_min": 1.5178618250785332,
    "reward_std": 0.1642494729722729,
    "timesteps": 182625138,
    "learntime": 0.1837275840807706,
    "sampletime": 8.733950152993202,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 529,
    "reward_mean": 1.8302837862679533,
    "reward_max": 2.116918739479978,
    "reward_min": 1.5311853917499456,
    "reward_std": 0.14681473478991428,
    "timesteps": 182985858,
    "learntime": 0.18282783101312816,
    "sampletime": 8.745712409960106,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 530,
    "reward_mean": 1.3750238701369377,
    "reward_max": 2.155181129209163,
    "reward_min": -6.667366567559337,
    "reward_std": 1.7720349893991574,
    "timesteps": 183345672,
    "learntime": 0.15814201696775854,
    "sampletime": 8.66979927290231,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 531,
    "reward_mean": 1.2792360675909604,
    "reward_max": 1.9969467656743314,
    "reward_min": -7.740129986809654,
    "reward_std": 1.968069011335141,
    "timesteps": 183705189,
    "learntime": 0.17927586194127798,
    "sampletime": 8.765400464879349,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 532,
    "reward_mean": 1.3906447564919484,
    "reward_max": 2.2203836335166027,
    "reward_min": -7.175873991031429,
    "reward_std": 1.885219916116609,
    "timesteps": 184064751,
    "learntime": 0.21528538316488266,
    "sampletime": 8.75882714590989,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 533,
    "reward_mean": 1.7550067253207655,
    "reward_max": 2.115713277810505,
    "reward_min": 1.4583213243820465,
    "reward_std": 0.15390940257888217,
    "timesteps": 184425471,
    "learntime": 0.17881429218687117,
    "sampletime": 8.708231151103973,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 534,
    "reward_mean": 1.7705215240048862,
    "reward_max": 2.1553333320268626,
    "reward_min": 1.3176269490539907,
    "reward_std": 0.14971250892613333,
    "timesteps": 184786191,
    "learntime": 0.23793200589716434,
    "sampletime": 8.720458596944809,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 535,
    "reward_mean": 1.8573394476573295,
    "reward_max": 2.1071981018176267,
    "reward_min": 1.3212139969462315,
    "reward_std": 0.13538045372547347,
    "timesteps": 185146911,
    "learntime": 0.184313896112144,
    "sampletime": 8.655777710024267,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 536,
    "reward_mean": 1.827741415085882,
    "reward_max": 2.1791423563117815,
    "reward_min": 1.4860780439586505,
    "reward_std": 0.15138248380045616,
    "timesteps": 185507631,
    "learntime": 0.22217959398403764,
    "sampletime": 8.797528171911836,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 537,
    "reward_mean": 1.842436004405765,
    "reward_max": 2.2189814803687913,
    "reward_min": 1.3113863777482122,
    "reward_std": 0.1681775011890989,
    "timesteps": 185868351,
    "learntime": 0.17415869911201298,
    "sampletime": 8.716495260829106,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 538,
    "reward_mean": 1.7466366652581553,
    "reward_max": 2.2876586101651104,
    "reward_min": 1.3709797800159622,
    "reward_std": 0.1499984564915846,
    "timesteps": 186229071,
    "learntime": 0.2201920140068978,
    "sampletime": 8.683823124039918,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 539,
    "reward_mean": 1.7102596577069082,
    "reward_max": 2.064197569831526,
    "reward_min": 1.315151706644839,
    "reward_std": 0.15556984505175772,
    "timesteps": 186589791,
    "learntime": 0.17603270383551717,
    "sampletime": 8.709484171122313,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 540,
    "reward_mean": 1.737550072796779,
    "reward_max": 2.0297885416181396,
    "reward_min": 1.4059494611997643,
    "reward_std": 0.1311506782370034,
    "timesteps": 186950511,
    "learntime": 0.22254964685998857,
    "sampletime": 8.901695006992668,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 541,
    "reward_mean": 1.8605642996715348,
    "reward_max": 2.1700691476862874,
    "reward_min": 1.4242824089746537,
    "reward_std": 0.16456860298302048,
    "timesteps": 187311231,
    "learntime": 0.1900115148164332,
    "sampletime": 8.801474150037393,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 542,
    "reward_mean": 1.8037564945336229,
    "reward_max": 2.2564927880885057,
    "reward_min": 1.4999679426958485,
    "reward_std": 0.1451115486302064,
    "timesteps": 187671951,
    "learntime": 0.22313955309800804,
    "sampletime": 8.7278507060837,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 543,
    "reward_mean": 1.4283338091693367,
    "reward_max": 2.058846670428683,
    "reward_min": -7.263147736137568,
    "reward_std": 1.900195213530468,
    "timesteps": 188031453,
    "learntime": 0.18413822608999908,
    "sampletime": 8.617151188896969,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 544,
    "reward_mean": 1.7948914905573496,
    "reward_max": 2.0913258142124174,
    "reward_min": 1.3267504242054782,
    "reward_std": 0.13999035525394612,
    "timesteps": 188392173,
    "learntime": 0.22751949494704604,
    "sampletime": 8.726143485866487,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 545,
    "reward_mean": 1.8281570643112093,
    "reward_max": 2.3676010775351144,
    "reward_min": 1.4728223870783508,
    "reward_std": 0.16070342700306436,
    "timesteps": 188752893,
    "learntime": 0.17856256407685578,
    "sampletime": 8.856460520066321,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 546,
    "reward_mean": 1.863940393723191,
    "reward_max": 2.085293580390773,
    "reward_min": 1.3667481290908492,
    "reward_std": 0.13366711973991882,
    "timesteps": 189113613,
    "learntime": 0.23797988193109632,
    "sampletime": 8.773114940151572,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 547,
    "reward_mean": 1.8645256577431595,
    "reward_max": 2.182993901489073,
    "reward_min": 1.449116940785833,
    "reward_std": 0.1565674061407851,
    "timesteps": 189474333,
    "learntime": 0.17106960294768214,
    "sampletime": 8.746142370859161,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 548,
    "reward_mean": 1.8552031783645573,
    "reward_max": 2.299483663859338,
    "reward_min": 1.4631063025380044,
    "reward_std": 0.19260803425656545,
    "timesteps": 189835053,
    "learntime": 0.21386604802682996,
    "sampletime": 8.790978142991662,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 549,
    "reward_mean": 1.8690327316942352,
    "reward_max": 2.123020745469888,
    "reward_min": 1.480781696371469,
    "reward_std": 0.1512539214523535,
    "timesteps": 190195773,
    "learntime": 0.18439294304698706,
    "sampletime": 8.694823666941375,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 550,
    "reward_mean": 1.8431514767326407,
    "reward_max": 2.239069471707224,
    "reward_min": 1.5495980523895296,
    "reward_std": 0.15752820085201555,
    "timesteps": 190556493,
    "learntime": 0.21191231696866453,
    "sampletime": 8.946011192863807,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 551,
    "reward_mean": 1.7323594218380722,
    "reward_max": 1.9761503499325799,
    "reward_min": 1.3445435219204436,
    "reward_std": 0.1311134165909926,
    "timesteps": 190917213,
    "learntime": 0.17090410506352782,
    "sampletime": 8.74339504307136,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 552,
    "reward_mean": 1.3006882763212644,
    "reward_max": 2.050990708814367,
    "reward_min": -7.152826697248122,
    "reward_std": 1.8737736908188551,
    "timesteps": 191276901,
    "learntime": 0.24951640889048576,
    "sampletime": 8.726139405043796,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 553,
    "reward_mean": 1.7801023509598495,
    "reward_max": 2.17444339645744,
    "reward_min": 1.40814500749746,
    "reward_std": 0.14863676133844708,
    "timesteps": 191637621,
    "learntime": 0.16990974103100598,
    "sampletime": 8.785599987022579,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 554,
    "reward_mean": 1.7577843220150433,
    "reward_max": 2.116769027307092,
    "reward_min": 1.3987854451277375,
    "reward_std": 0.15766925999197953,
    "timesteps": 191998341,
    "learntime": 0.22312731598503888,
    "sampletime": 8.595223136944696,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 555,
    "reward_mean": 1.7565487455300064,
    "reward_max": 2.042809523726727,
    "reward_min": 1.428896218271828,
    "reward_std": 0.13912574253683269,
    "timesteps": 192359061,
    "learntime": 0.17096396791748703,
    "sampletime": 8.603473857045174,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 556,
    "reward_mean": 1.8258746603328118,
    "reward_max": 2.1811185801264115,
    "reward_min": 1.5025472879325101,
    "reward_std": 0.14485581488731122,
    "timesteps": 192719781,
    "learntime": 0.22509393491782248,
    "sampletime": 8.507920536911115,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 557,
    "reward_mean": 1.7972938688975146,
    "reward_max": 2.1730216523971033,
    "reward_min": 1.394989098972553,
    "reward_std": 0.15194100965914914,
    "timesteps": 193080501,
    "learntime": 0.21787125803530216,
    "sampletime": 8.754727663006634,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 558,
    "reward_mean": 1.8394147455754575,
    "reward_max": 2.194544048896975,
    "reward_min": 1.472366637558892,
    "reward_std": 0.146817466929172,
    "timesteps": 193441221,
    "learntime": 0.17834461387246847,
    "sampletime": 8.754377882927656,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 559,
    "reward_mean": 1.7884872050728786,
    "reward_max": 2.3377856274495206,
    "reward_min": 1.4165494798928362,
    "reward_std": 0.19003781799127334,
    "timesteps": 193801941,
    "learntime": 0.20886902092024684,
    "sampletime": 8.708326115040109,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 560,
    "reward_mean": 1.413734166596036,
    "reward_max": 2.256990612690004,
    "reward_min": -6.960833976161669,
    "reward_std": 1.837812784482014,
    "timesteps": 194161599,
    "learntime": 0.1777804591692984,
    "sampletime": 8.583400781964883,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 561,
    "reward_mean": 1.8226759169558084,
    "reward_max": 2.2066057348045294,
    "reward_min": 1.4633146542420754,
    "reward_std": 0.1687818314915252,
    "timesteps": 194522319,
    "learntime": 0.22450480610132217,
    "sampletime": 8.704569100867957,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 562,
    "reward_mean": 1.837132582567929,
    "reward_max": 2.1407662236809033,
    "reward_min": 1.4602482907022476,
    "reward_std": 0.14655189532446053,
    "timesteps": 194883039,
    "learntime": 0.23427737900055945,
    "sampletime": 8.727662260876969,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 563,
    "reward_mean": 1.3661600794460558,
    "reward_max": 2.057399860342732,
    "reward_min": -6.972427672244411,
    "reward_std": 1.7649550737985422,
    "timesteps": 195242565,
    "learntime": 0.16792831500060856,
    "sampletime": 8.824045730056241,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 564,
    "reward_mean": 1.4211492927943854,
    "reward_max": 2.1663269713965474,
    "reward_min": -7.422871255183552,
    "reward_std": 1.9049693124720861,
    "timesteps": 195602064,
    "learntime": 0.1872363151051104,
    "sampletime": 8.763395549030975,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 565,
    "reward_mean": 1.8016967499879841,
    "reward_max": 2.094044535590164,
    "reward_min": 1.461604949166277,
    "reward_std": 0.13867406017604475,
    "timesteps": 195962784,
    "learntime": 0.23351739207282662,
    "sampletime": 8.77119919611141,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 566,
    "reward_mean": 1.4646894391405385,
    "reward_max": 2.257415161024913,
    "reward_min": -6.888808419956178,
    "reward_std": 1.80974674421337,
    "timesteps": 196322475,
    "learntime": 0.17273221304640174,
    "sampletime": 8.859709199983627,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 567,
    "reward_mean": 0.6175466960413704,
    "reward_max": 2.1857806722594706,
    "reward_min": -7.538074975596942,
    "reward_std": 3.0498629923385594,
    "timesteps": 196680009,
    "learntime": 0.2253143738489598,
    "sampletime": 8.760114541044459,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 568,
    "reward_mean": 1.4102678518833969,
    "reward_max": 2.2991150991601303,
    "reward_min": -6.962859036097532,
    "reward_std": 1.8067912746550394,
    "timesteps": 197039700,
    "learntime": 0.17840453004464507,
    "sampletime": 8.893268575891852,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 569,
    "reward_mean": 1.7775847191692637,
    "reward_max": 2.1448026427745117,
    "reward_min": 1.3236550408101786,
    "reward_std": 0.1740993279477389,
    "timesteps": 197400420,
    "learntime": 0.21789824403822422,
    "sampletime": 8.733269884018227,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 570,
    "reward_mean": 1.4497108988446967,
    "reward_max": 2.1819803650938714,
    "reward_min": -6.9238067751210846,
    "reward_std": 1.8392959305632766,
    "timesteps": 197760087,
    "learntime": 0.17759512388147414,
    "sampletime": 8.670633675996214,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 571,
    "reward_mean": 1.3961602109291102,
    "reward_max": 2.088471622203036,
    "reward_min": -7.109125728112168,
    "reward_std": 1.7742011479998463,
    "timesteps": 198119754,
    "learntime": 0.22630546614527702,
    "sampletime": 8.733552356949076,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 572,
    "reward_mean": 1.754554734242949,
    "reward_max": 2.138685429633671,
    "reward_min": 1.2748194795285288,
    "reward_std": 0.17586841927192648,
    "timesteps": 198480474,
    "learntime": 0.1750248319003731,
    "sampletime": 8.820326385088265,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 573,
    "reward_mean": 1.8322923514299203,
    "reward_max": 2.27569055105524,
    "reward_min": 1.4359902940817502,
    "reward_std": 0.16104116353696032,
    "timesteps": 198841194,
    "learntime": 0.23698775190860033,
    "sampletime": 8.721298201940954,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 574,
    "reward_mean": 1.7879167645083547,
    "reward_max": 2.1477234064994293,
    "reward_min": 1.329282497098159,
    "reward_std": 0.15760253473374283,
    "timesteps": 199201914,
    "learntime": 0.1796656991355121,
    "sampletime": 8.718398020137101,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 575,
    "reward_mean": 1.8015297693163086,
    "reward_max": 2.192535853230055,
    "reward_min": 1.4015319938806678,
    "reward_std": 0.16077332964461988,
    "timesteps": 199562634,
    "learntime": 0.22524524596519768,
    "sampletime": 8.673257695045322,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 576,
    "reward_mean": 1.008214390955045,
    "reward_max": 2.1924991815096933,
    "reward_min": -7.1870841298174755,
    "reward_std": 2.574272841429639,
    "timesteps": 199921479,
    "learntime": 0.18874053517356515,
    "sampletime": 8.71040260209702,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 577,
    "reward_mean": 1.8954752095130762,
    "reward_max": 2.2496917006475,
    "reward_min": 1.5885087646668332,
    "reward_std": 0.14306425139287396,
    "timesteps": 200282199,
    "learntime": 0.21409857901744545,
    "sampletime": 8.779005591990426,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 578,
    "reward_mean": 1.892648842691131,
    "reward_max": 2.2281451189159633,
    "reward_min": 1.5695924089963982,
    "reward_std": 0.1485045201980887,
    "timesteps": 200642919,
    "learntime": 0.1826479178853333,
    "sampletime": 8.75826919497922,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 579,
    "reward_mean": 1.8366784154226052,
    "reward_max": 2.1883323178697136,
    "reward_min": 1.5095164407111652,
    "reward_std": 0.1462902868516682,
    "timesteps": 201003639,
    "learntime": 0.23072728794068098,
    "sampletime": 8.867087913211435,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 580,
    "reward_mean": 1.3845556953717633,
    "reward_max": 2.225006548985909,
    "reward_min": -7.140986553559111,
    "reward_std": 1.8361305630355118,
    "timesteps": 201363159,
    "learntime": 0.18737380811944604,
    "sampletime": 8.579398585949093,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 581,
    "reward_mean": 1.8058596796438635,
    "reward_max": 2.2008765641965304,
    "reward_min": 1.466373751158681,
    "reward_std": 0.14146710675787016,
    "timesteps": 201723879,
    "learntime": 0.22149055800400674,
    "sampletime": 8.867308922111988,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 582,
    "reward_mean": 1.781964006938837,
    "reward_max": 2.0982660866357015,
    "reward_min": 1.4669575679452234,
    "reward_std": 0.1553936002895613,
    "timesteps": 202084599,
    "learntime": 0.18333693803288043,
    "sampletime": 8.644659760175273,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 583,
    "reward_mean": 1.4416566408543847,
    "reward_max": 2.3578147153523505,
    "reward_min": -14.630246362450835,
    "reward_std": 2.315370703760151,
    "timesteps": 202444149,
    "learntime": 0.22597528295591474,
    "sampletime": 8.722785959020257,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 584,
    "reward_mean": 1.7705204877615544,
    "reward_max": 2.162864464522112,
    "reward_min": 1.434524084804718,
    "reward_std": 0.13048468424428789,
    "timesteps": 202804869,
    "learntime": 0.18721837108023465,
    "sampletime": 8.672540449071676,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 585,
    "reward_mean": 1.7630484868588412,
    "reward_max": 2.1454979939612007,
    "reward_min": 1.4769915848155468,
    "reward_std": 0.14790785313708643,
    "timesteps": 203165589,
    "learntime": 0.23201430798508227,
    "sampletime": 8.82981317397207,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 586,
    "reward_mean": 1.7855164740403655,
    "reward_max": 2.2059202744999427,
    "reward_min": 1.454967169239267,
    "reward_std": 0.15141963101221395,
    "timesteps": 203526309,
    "learntime": 0.17709892080165446,
    "sampletime": 8.965723141096532,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 587,
    "reward_mean": 1.7808493419334122,
    "reward_max": 2.189927950999732,
    "reward_min": 1.4658882226371601,
    "reward_std": 0.1146770861763714,
    "timesteps": 203887029,
    "learntime": 0.22393759596161544,
    "sampletime": 8.762029021047056,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 588,
    "reward_mean": 1.8563748716148196,
    "reward_max": 2.2213990671787704,
    "reward_min": 1.4231585233523416,
    "reward_std": 0.16493657180379223,
    "timesteps": 204247749,
    "learntime": 0.17422428587451577,
    "sampletime": 8.8169345788192,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 589,
    "reward_mean": 1.8248577348528618,
    "reward_max": 2.16224907658276,
    "reward_min": 1.4190584756857285,
    "reward_std": 0.17165391815583453,
    "timesteps": 204608469,
    "learntime": 0.24320833897218108,
    "sampletime": 8.784439370036125,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 590,
    "reward_mean": 1.3847799215941015,
    "reward_max": 2.096051202945199,
    "reward_min": -15.884695450131515,
    "reward_std": 2.4294790793391687,
    "timesteps": 204968196,
    "learntime": 0.19243942596949637,
    "sampletime": 8.75759800313972,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 591,
    "reward_mean": 1.7946121196102334,
    "reward_max": 2.225225452227856,
    "reward_min": 1.4508067437228875,
    "reward_std": 0.1568430787033212,
    "timesteps": 205328916,
    "learntime": 0.213681410998106,
    "sampletime": 8.63723264192231,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 592,
    "reward_mean": 1.8630081639420697,
    "reward_max": 2.2468078043711475,
    "reward_min": 1.5062928490480034,
    "reward_std": 0.17100415961990836,
    "timesteps": 205689636,
    "learntime": 0.17654443811625242,
    "sampletime": 8.722823695046827,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 593,
    "reward_mean": 1.79171542058019,
    "reward_max": 2.340829390713195,
    "reward_min": 1.359795588437749,
    "reward_std": 0.18984416403367954,
    "timesteps": 206050356,
    "learntime": 0.22846547118388116,
    "sampletime": 8.891290633007884,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 594,
    "reward_mean": 1.839555797240433,
    "reward_max": 2.3399020059571,
    "reward_min": 1.3334633031627148,
    "reward_std": 0.17512822095297395,
    "timesteps": 206411076,
    "learntime": 0.18142023915424943,
    "sampletime": 8.626913703978062,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 595,
    "reward_mean": 1.8840383732827486,
    "reward_max": 2.2990537173818875,
    "reward_min": 1.5868347570173078,
    "reward_std": 0.148546903319008,
    "timesteps": 206771796,
    "learntime": 0.21734172198921442,
    "sampletime": 8.718648694921285,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 596,
    "reward_mean": 1.9155203951800504,
    "reward_max": 2.3518206279735403,
    "reward_min": 1.5315054388713276,
    "reward_std": 0.15689630626768283,
    "timesteps": 207132516,
    "learntime": 0.18605667003430426,
    "sampletime": 8.711386961163953,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 597,
    "reward_mean": 1.823437665068632,
    "reward_max": 2.114750667423128,
    "reward_min": 1.4472254150605266,
    "reward_std": 0.16721069262054727,
    "timesteps": 207493236,
    "learntime": 0.2421216550283134,
    "sampletime": 8.62096771900542,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 598,
    "reward_mean": 1.8408148777137376,
    "reward_max": 2.2313513939481027,
    "reward_min": 1.5192180222533551,
    "reward_std": 0.13245411223717304,
    "timesteps": 207853956,
    "learntime": 0.172772723948583,
    "sampletime": 8.669115547090769,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 599,
    "reward_mean": 1.7625919844523867,
    "reward_max": 2.1055282786385026,
    "reward_min": 1.4278768303774967,
    "reward_std": 0.12582485989891742,
    "timesteps": 208214676,
    "learntime": 0.17072033905424178,
    "sampletime": 8.796031187986955,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 600,
    "reward_mean": 1.7752374109212172,
    "reward_max": 1.9973524682943429,
    "reward_min": 1.5489673076016388,
    "reward_std": 0.12475442724558232,
    "timesteps": 208575396,
    "learntime": 0.18154754606075585,
    "sampletime": 8.768205789849162,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 601,
    "reward_mean": 1.7487129778526078,
    "reward_max": 2.0269318158137697,
    "reward_min": 1.360617895465991,
    "reward_std": 0.1364443548925319,
    "timesteps": 208936116,
    "learntime": 0.1129490218590945,
    "sampletime": 8.62166512105614,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 602,
    "reward_mean": 1.7513469450751304,
    "reward_max": 2.0685973998695366,
    "reward_min": 1.5486715997950236,
    "reward_std": 0.13801521145382506,
    "timesteps": 209296836,
    "learntime": 0.23548520100302994,
    "sampletime": 8.624095991021022,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 603,
    "reward_mean": 1.413493387337597,
    "reward_max": 2.3313444301020345,
    "reward_min": -7.465860246123296,
    "reward_std": 1.952994344200406,
    "timesteps": 209656290,
    "learntime": 0.17662307410500944,
    "sampletime": 8.638652913970873,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 604,
    "reward_mean": 1.4612462284696668,
    "reward_max": 2.192533960894003,
    "reward_min": -7.518600518992326,
    "reward_std": 1.8964662170008995,
    "timesteps": 210015744,
    "learntime": 0.23043203516863286,
    "sampletime": 8.60862625297159,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 605,
    "reward_mean": 1.8229665996943991,
    "reward_max": 2.098810666784681,
    "reward_min": 1.4580828353443338,
    "reward_std": 0.1611727745792663,
    "timesteps": 210376464,
    "learntime": 0.1857748031616211,
    "sampletime": 8.604587169829756,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 606,
    "reward_mean": 1.7447235134285954,
    "reward_max": 2.0794458877344635,
    "reward_min": 1.401401819813392,
    "reward_std": 0.15600160357726114,
    "timesteps": 210737184,
    "learntime": 0.2157578261103481,
    "sampletime": 8.757426367839798,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 607,
    "reward_mean": 1.755988683925143,
    "reward_max": 2.049046002512719,
    "reward_min": 1.4855289468188921,
    "reward_std": 0.14416135728878854,
    "timesteps": 211097904,
    "learntime": 0.18032432906329632,
    "sampletime": 8.574312990996987,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 608,
    "reward_mean": 1.835035460543388,
    "reward_max": 2.1616671462194934,
    "reward_min": 1.4840993433187526,
    "reward_std": 0.14038003927113143,
    "timesteps": 211458624,
    "learntime": 0.228506542975083,
    "sampletime": 8.740591251058504,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 609,
    "reward_mean": 1.8469427241836187,
    "reward_max": 2.191159961376493,
    "reward_min": 1.4674536850440987,
    "reward_std": 0.16304746982033216,
    "timesteps": 211819344,
    "learntime": 0.17738216510042548,
    "sampletime": 8.688799876952544,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 610,
    "reward_mean": 1.8057755145591277,
    "reward_max": 2.0793021655973067,
    "reward_min": 1.47845923385378,
    "reward_std": 0.13995771892073394,
    "timesteps": 212180064,
    "learntime": 0.22655826690606773,
    "sampletime": 8.746307784924284,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 611,
    "reward_mean": 1.7935608776648688,
    "reward_max": 2.242034716873825,
    "reward_min": 1.4042661483294447,
    "reward_std": 0.17164620268557124,
    "timesteps": 212540784,
    "learntime": 0.1764084380120039,
    "sampletime": 8.711165129905567,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 612,
    "reward_mean": 1.8357749487554784,
    "reward_max": 2.2785634395479426,
    "reward_min": 1.4757711728540877,
    "reward_std": 0.15973690045373692,
    "timesteps": 212901504,
    "learntime": 0.20632901601493359,
    "sampletime": 8.7437526229769,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 613,
    "reward_mean": 1.8317461322291806,
    "reward_max": 2.169506820024583,
    "reward_min": 1.5919999530923412,
    "reward_std": 0.1454522179859064,
    "timesteps": 213262224,
    "learntime": 0.1852601650170982,
    "sampletime": 8.726814344990999,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 614,
    "reward_mean": 1.8988206323804027,
    "reward_max": 2.3475153649536256,
    "reward_min": 1.6341194289590613,
    "reward_std": 0.1462344866942046,
    "timesteps": 213622944,
    "learntime": 0.2479075298178941,
    "sampletime": 8.795253666117787,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 615,
    "reward_mean": 1.815399894635822,
    "reward_max": 2.3430523560029646,
    "reward_min": 1.4607398763799915,
    "reward_std": 0.17724480246993232,
    "timesteps": 213983664,
    "learntime": 0.18086385913193226,
    "sampletime": 8.888663864927366,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 616,
    "reward_mean": 1.7703503062886738,
    "reward_max": 2.1209140815190017,
    "reward_min": 1.4411182832845915,
    "reward_std": 0.14714656632841763,
    "timesteps": 214344384,
    "learntime": 0.23563787806779146,
    "sampletime": 8.677683643996716,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 617,
    "reward_mean": 1.8269237901781992,
    "reward_max": 2.117922883678338,
    "reward_min": 1.4535365634963222,
    "reward_std": 0.13234749454086248,
    "timesteps": 214705104,
    "learntime": 0.1746207349933684,
    "sampletime": 8.761187074938789,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 618,
    "reward_mean": 1.8870165164670007,
    "reward_max": 2.190286496879926,
    "reward_min": 1.5840106952977762,
    "reward_std": 0.14479602959820184,
    "timesteps": 215065824,
    "learntime": 0.2405034899711609,
    "sampletime": 8.656768886139616,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 619,
    "reward_mean": 1.9566750899555363,
    "reward_max": 2.464076336286475,
    "reward_min": 1.5233658754044528,
    "reward_std": 0.19197110568580575,
    "timesteps": 215426544,
    "learntime": 0.17908146395348012,
    "sampletime": 8.705707625951618,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 620,
    "reward_mean": 1.9036075115458826,
    "reward_max": 2.2817077470458673,
    "reward_min": 1.5959988510603018,
    "reward_std": 0.15663780078150302,
    "timesteps": 215787264,
    "learntime": 0.23252172907814384,
    "sampletime": 8.74751635408029,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 621,
    "reward_mean": 1.7757850338231445,
    "reward_max": 2.2211214632001357,
    "reward_min": 1.4897929195140005,
    "reward_std": 0.1677097650880994,
    "timesteps": 216147984,
    "learntime": 0.17575474991463125,
    "sampletime": 8.695029421942309,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 622,
    "reward_mean": 1.85021621605076,
    "reward_max": 2.225400336806405,
    "reward_min": 1.4558398920520559,
    "reward_std": 0.17786107762290582,
    "timesteps": 216508704,
    "learntime": 0.2371534809935838,
    "sampletime": 8.69564625993371,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 623,
    "reward_mean": 1.8431354090225576,
    "reward_max": 2.3180939280605823,
    "reward_min": 1.5897972570585066,
    "reward_std": 0.1361717915623311,
    "timesteps": 216869424,
    "learntime": 0.19151952117681503,
    "sampletime": 8.764447182882577,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 624,
    "reward_mean": 1.8168327893813832,
    "reward_max": 2.260832789000837,
    "reward_min": 1.450316360458433,
    "reward_std": 0.16528692507156686,
    "timesteps": 217230144,
    "learntime": 0.2393208749126643,
    "sampletime": 8.741960644954816,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 625,
    "reward_mean": 1.8058573687092547,
    "reward_max": 2.1177152233237106,
    "reward_min": 1.4479005340712503,
    "reward_std": 0.14549995264851126,
    "timesteps": 217590864,
    "learntime": 0.17936581606045365,
    "sampletime": 8.64318911684677,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 626,
    "reward_mean": 1.8206658818978747,
    "reward_max": 2.259095618175649,
    "reward_min": 1.4325950239160132,
    "reward_std": 0.15085714764770447,
    "timesteps": 217951584,
    "learntime": 0.22235619113780558,
    "sampletime": 8.636491874000058,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 627,
    "reward_mean": 1.7955287858799216,
    "reward_max": 2.378519157078256,
    "reward_min": 1.4801150876260651,
    "reward_std": 0.14798004671011725,
    "timesteps": 218312304,
    "learntime": 0.18308549281209707,
    "sampletime": 8.804449398070574,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 628,
    "reward_mean": 1.7660128994526578,
    "reward_max": 2.159029520309007,
    "reward_min": 1.4056423975747396,
    "reward_std": 0.154196575528102,
    "timesteps": 218673024,
    "learntime": 0.18292202707380056,
    "sampletime": 8.756333740893751,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 629,
    "reward_mean": 1.8015300550224183,
    "reward_max": 2.1212639859701112,
    "reward_min": 1.2771470396793563,
    "reward_std": 0.16201028941509404,
    "timesteps": 219033744,
    "learntime": 0.18365591508336365,
    "sampletime": 8.764964937930927,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 630,
    "reward_mean": 1.753569464529559,
    "reward_max": 2.07410588858395,
    "reward_min": 1.490802552842068,
    "reward_std": 0.14078956467718634,
    "timesteps": 219394464,
    "learntime": 0.2399510929826647,
    "sampletime": 8.76742993388325,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 631,
    "reward_mean": 1.7693258401897132,
    "reward_max": 2.143795381247234,
    "reward_min": 1.3951851469358738,
    "reward_std": 0.15398424222132656,
    "timesteps": 219755184,
    "learntime": 0.17941351816989481,
    "sampletime": 8.768380673136562,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 632,
    "reward_mean": 1.8295773950271697,
    "reward_max": 2.187883957868588,
    "reward_min": 1.455766958294339,
    "reward_std": 0.15321575558851933,
    "timesteps": 220115904,
    "learntime": 0.17934601311571896,
    "sampletime": 8.813191181980073,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 633,
    "reward_mean": 1.8590144685920305,
    "reward_max": 2.3429988773634887,
    "reward_min": 1.53748756487656,
    "reward_std": 0.17483356421538046,
    "timesteps": 220476624,
    "learntime": 0.18027963815256953,
    "sampletime": 8.713248032145202,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 634,
    "reward_mean": 1.9160257167053003,
    "reward_max": 2.2417602183184364,
    "reward_min": 1.6478839141006254,
    "reward_std": 0.12669674660790856,
    "timesteps": 220837344,
    "learntime": 0.1875720340758562,
    "sampletime": 8.810965589946136,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 635,
    "reward_mean": 1.4438685678887584,
    "reward_max": 2.172986847510782,
    "reward_min": -7.4709732111995,
    "reward_std": 1.922619711260903,
    "timesteps": 221196876,
    "learntime": 0.1775204250589013,
    "sampletime": 8.721412954153493,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 636,
    "reward_mean": 1.8004324259130238,
    "reward_max": 2.146739297126644,
    "reward_min": 1.4276315602368066,
    "reward_std": 0.15861497719775422,
    "timesteps": 221557596,
    "learntime": 0.1818614408839494,
    "sampletime": 8.799004175001755,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 637,
    "reward_mean": 1.7647622031458456,
    "reward_max": 2.062624563338678,
    "reward_min": 1.3613178502189693,
    "reward_std": 0.15046552184700754,
    "timesteps": 221918316,
    "learntime": 0.18482359312474728,
    "sampletime": 8.993704941822216,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 638,
    "reward_mean": 1.7702072375315554,
    "reward_max": 2.1664382998203595,
    "reward_min": 1.383094376184288,
    "reward_std": 0.16618010803126898,
    "timesteps": 222279036,
    "learntime": 0.179353890940547,
    "sampletime": 8.697096223011613,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 639,
    "reward_mean": 1.3846498455661997,
    "reward_max": 2.195380764006224,
    "reward_min": -7.43157361686992,
    "reward_std": 1.867663809759805,
    "timesteps": 222638736,
    "learntime": 0.18271016515791416,
    "sampletime": 8.711369250901043,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 640,
    "reward_mean": 1.788251751398926,
    "reward_max": 2.086127815432984,
    "reward_min": 1.4597352684570701,
    "reward_std": 0.14015900032340115,
    "timesteps": 222999456,
    "learntime": 0.18620053306221962,
    "sampletime": 8.802766592940316,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 641,
    "reward_mean": 1.7497127037885536,
    "reward_max": 2.1627001243354163,
    "reward_min": 1.3446902489751755,
    "reward_std": 0.15648656639608663,
    "timesteps": 223360176,
    "learntime": 0.17889574216678739,
    "sampletime": 8.774382625939324,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 642,
    "reward_mean": 1.7775910574777567,
    "reward_max": 2.1234867475242463,
    "reward_min": 1.476479665030525,
    "reward_std": 0.16197940088841203,
    "timesteps": 223720896,
    "learntime": 0.1836614259518683,
    "sampletime": 8.898330197902396,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 643,
    "reward_mean": 1.8374143952753743,
    "reward_max": 2.1578297930326573,
    "reward_min": 1.4801605482123577,
    "reward_std": 0.14313981388568064,
    "timesteps": 224081616,
    "learntime": 0.17908337689004838,
    "sampletime": 8.697412859881297,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 644,
    "reward_mean": 1.8710839895894371,
    "reward_max": 2.2339784179498405,
    "reward_min": 1.5827666717355648,
    "reward_std": 0.13671458664928754,
    "timesteps": 224442336,
    "learntime": 0.18477199994958937,
    "sampletime": 8.801642443984747,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 645,
    "reward_mean": 1.8481693701451687,
    "reward_max": 2.343736558722217,
    "reward_min": 1.5140245283731573,
    "reward_std": 0.1762282450913297,
    "timesteps": 224803056,
    "learntime": 0.19833079096861184,
    "sampletime": 8.712342796148732,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 646,
    "reward_mean": 1.8106609940548761,
    "reward_max": 2.1986589929696865,
    "reward_min": 1.481177719963435,
    "reward_std": 0.142032574398367,
    "timesteps": 225163776,
    "learntime": 0.17829635995440185,
    "sampletime": 8.857624999945983,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 647,
    "reward_mean": 1.8284565135771844,
    "reward_max": 2.1719051654686643,
    "reward_min": 1.538445498464471,
    "reward_std": 0.14758789573967457,
    "timesteps": 225524496,
    "learntime": 0.18251303979195654,
    "sampletime": 8.74102105689235,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 648,
    "reward_mean": 1.845741845369828,
    "reward_max": 2.214617479571393,
    "reward_min": 1.472153558358319,
    "reward_std": 0.15380297907946805,
    "timesteps": 225885216,
    "learntime": 0.18300593714229763,
    "sampletime": 8.790960642974824,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 649,
    "reward_mean": 1.7844757454686622,
    "reward_max": 2.1239968094389146,
    "reward_min": 1.370915829052328,
    "reward_std": 0.14955023023979197,
    "timesteps": 226245936,
    "learntime": 0.1774041960015893,
    "sampletime": 8.787369463127106,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 650,
    "reward_mean": 1.8535116889940346,
    "reward_max": 2.3094555412826585,
    "reward_min": 1.5031254282597102,
    "reward_std": 0.18480566863312675,
    "timesteps": 226606656,
    "learntime": 0.184899325016886,
    "sampletime": 8.734731717035174,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 651,
    "reward_mean": 1.3307015045322954,
    "reward_max": 2.0197148483452043,
    "reward_min": -7.133676736192272,
    "reward_std": 1.8686059626465725,
    "timesteps": 226966278,
    "learntime": 0.19520649407058954,
    "sampletime": 8.874493753071874,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 652,
    "reward_mean": 1.8251597313531107,
    "reward_max": 2.2125958536723322,
    "reward_min": 1.4231759248469809,
    "reward_std": 0.15395452649630603,
    "timesteps": 227326998,
    "learntime": 0.18125218409113586,
    "sampletime": 8.759692359017208,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 653,
    "reward_mean": 1.7902900122260474,
    "reward_max": 2.2565505993693566,
    "reward_min": 1.2447105884255651,
    "reward_std": 0.18325294544218035,
    "timesteps": 227687718,
    "learntime": 0.18451141682453454,
    "sampletime": 8.746644002152607,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 654,
    "reward_mean": 1.759978570528895,
    "reward_max": 2.215016295779078,
    "reward_min": 1.37122572603226,
    "reward_std": 0.16304242406041117,
    "timesteps": 228048438,
    "learntime": 0.17549462104216218,
    "sampletime": 8.823562416015193,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 655,
    "reward_mean": 1.762400937573999,
    "reward_max": 2.2195402629228957,
    "reward_min": 1.330326518105169,
    "reward_std": 0.1830007211470157,
    "timesteps": 228409158,
    "learntime": 0.18651870894245803,
    "sampletime": 8.80623413901776,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 656,
    "reward_mean": 1.7704402996623432,
    "reward_max": 2.1088539574852656,
    "reward_min": 1.3584554218986948,
    "reward_std": 0.1473846274051081,
    "timesteps": 228769878,
    "learntime": 0.20056509296409786,
    "sampletime": 8.696146978996694,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 657,
    "reward_mean": 1.8468656645743518,
    "reward_max": 2.1001482036768997,
    "reward_min": 1.4841575393780415,
    "reward_std": 0.14491552360741766,
    "timesteps": 229130598,
    "learntime": 0.18109884997829795,
    "sampletime": 8.730514785042033,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 658,
    "reward_mean": 1.8294070441566723,
    "reward_max": 2.1934342327824004,
    "reward_min": 1.589785665545299,
    "reward_std": 0.13409738332780952,
    "timesteps": 229491318,
    "learntime": 0.19305663905106485,
    "sampletime": 8.821594537934288,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 659,
    "reward_mean": 1.3646857440715563,
    "reward_max": 2.128812896144207,
    "reward_min": -7.315671457856135,
    "reward_std": 1.9082890581479786,
    "timesteps": 229850919,
    "learntime": 0.18421896104700863,
    "sampletime": 8.749686107970774,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 660,
    "reward_mean": 0.9388403866169637,
    "reward_max": 2.1243634897568175,
    "reward_min": -7.397133919413937,
    "reward_std": 2.5618664896534544,
    "timesteps": 230209401,
    "learntime": 0.1858538610395044,
    "sampletime": 8.69917094311677,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 661,
    "reward_mean": 1.346564921095803,
    "reward_max": 2.2945304360553993,
    "reward_min": -6.927357249843863,
    "reward_std": 1.7468643787737248,
    "timesteps": 230569002,
    "learntime": 0.18983347807079554,
    "sampletime": 8.65574633399956,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 662,
    "reward_mean": 1.772558366610908,
    "reward_max": 2.1920353653875972,
    "reward_min": 1.4340660375180743,
    "reward_std": 0.16512025214443815,
    "timesteps": 230929722,
    "learntime": 0.18272708100266755,
    "sampletime": 8.651880261022598,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 663,
    "reward_mean": 1.8510609511594986,
    "reward_max": 2.36518509515074,
    "reward_min": 1.4826233641978197,
    "reward_std": 0.16390649285196468,
    "timesteps": 231290442,
    "learntime": 0.18949419213458896,
    "sampletime": 8.745159676996991,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 664,
    "reward_mean": 1.8388450624862256,
    "reward_max": 2.236919591325035,
    "reward_min": 1.4857279454302998,
    "reward_std": 0.1549961923593186,
    "timesteps": 231651162,
    "learntime": 0.18468315503560007,
    "sampletime": 8.84111569612287,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 665,
    "reward_mean": 1.8287808370639915,
    "reward_max": 2.1348204830552038,
    "reward_min": 1.4899629860693948,
    "reward_std": 0.13744008257264936,
    "timesteps": 232011882,
    "learntime": 0.19549439218826592,
    "sampletime": 8.784561205189675,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 666,
    "reward_mean": 1.7957037724857388,
    "reward_max": 2.1245400083328887,
    "reward_min": 1.5279687526263919,
    "reward_std": 0.127561379801121,
    "timesteps": 232372602,
    "learntime": 0.17346584401093423,
    "sampletime": 8.712174744810909,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 667,
    "reward_mean": 1.8231036792887183,
    "reward_max": 2.0792309326281977,
    "reward_min": 1.5879463903485962,
    "reward_std": 0.12233075336336524,
    "timesteps": 232733322,
    "learntime": 0.1753567059058696,
    "sampletime": 8.693047954933718,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 668,
    "reward_mean": 1.826733944709401,
    "reward_max": 2.1139366586540915,
    "reward_min": 1.5213867041165914,
    "reward_std": 0.13954708906101962,
    "timesteps": 233094042,
    "learntime": 0.18020970304496586,
    "sampletime": 8.75725802197121,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 669,
    "reward_mean": 1.7916136695414888,
    "reward_max": 2.2297251352733407,
    "reward_min": 1.2725970654185694,
    "reward_std": 0.17899136465742185,
    "timesteps": 233454762,
    "learntime": 0.18491172487847507,
    "sampletime": 8.73338974895887,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 670,
    "reward_mean": 1.7877707143419177,
    "reward_max": 2.0921275319369355,
    "reward_min": 1.4918924275570467,
    "reward_std": 0.1328175180252871,
    "timesteps": 233815482,
    "learntime": 0.1870156980585307,
    "sampletime": 8.740379834081978,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 671,
    "reward_mean": 1.8353740581970137,
    "reward_max": 2.186766343861093,
    "reward_min": 1.3730226477509269,
    "reward_std": 0.17396581872288244,
    "timesteps": 234176202,
    "learntime": 0.1791278631426394,
    "sampletime": 8.86447203392163,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 672,
    "reward_mean": 1.829586553189296,
    "reward_max": 2.1910168630161517,
    "reward_min": 1.472762663936006,
    "reward_std": 0.14792460364392254,
    "timesteps": 234536922,
    "learntime": 0.18803465296514332,
    "sampletime": 8.874368961900473,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 673,
    "reward_mean": 1.8317097033559868,
    "reward_max": 2.10982226234222,
    "reward_min": 1.5606168721137523,
    "reward_std": 0.1237092589366308,
    "timesteps": 234897642,
    "learntime": 0.18023702688515186,
    "sampletime": 8.68030822603032,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 674,
    "reward_mean": 1.8909190125852051,
    "reward_max": 2.2172631865003907,
    "reward_min": 1.586458542364802,
    "reward_std": 0.15270243767810554,
    "timesteps": 235258362,
    "learntime": 0.18297290499322116,
    "sampletime": 8.747071409132332,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 675,
    "reward_mean": 1.9272244174404916,
    "reward_max": 2.30642200266734,
    "reward_min": 1.5587211228751867,
    "reward_std": 0.14600903754507316,
    "timesteps": 235619082,
    "learntime": 0.18581477482803166,
    "sampletime": 8.717329006874934,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 676,
    "reward_mean": 1.83758883186375,
    "reward_max": 2.1853197970665614,
    "reward_min": 1.3487572315275556,
    "reward_std": 0.14845457334434353,
    "timesteps": 235979802,
    "learntime": 0.18074978003278375,
    "sampletime": 8.651621748926118,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 677,
    "reward_mean": 1.7222010318667602,
    "reward_max": 2.074601461557462,
    "reward_min": 1.3065578730024223,
    "reward_std": 0.16220045359297575,
    "timesteps": 236340522,
    "learntime": 0.18849747302010655,
    "sampletime": 8.769515705062076,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 678,
    "reward_mean": 1.7616657129814652,
    "reward_max": 2.307063769884265,
    "reward_min": 1.3488773848106497,
    "reward_std": 0.1854397945316524,
    "timesteps": 236701242,
    "learntime": 0.19201201596297324,
    "sampletime": 8.743220496922731,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 679,
    "reward_mean": 1.733421366052346,
    "reward_max": 2.0775807799143458,
    "reward_min": 1.3826648526517202,
    "reward_std": 0.15935524770824533,
    "timesteps": 237061962,
    "learntime": 0.18182333814911544,
    "sampletime": 8.87304966407828,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 680,
    "reward_mean": 1.8652311227733418,
    "reward_max": 2.2709702705879757,
    "reward_min": 1.423024704155534,
    "reward_std": 0.17239702717649275,
    "timesteps": 237422682,
    "learntime": 0.18511769594624639,
    "sampletime": 8.705430340021849,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 681,
    "reward_mean": 1.851590598977795,
    "reward_max": 2.217272043000607,
    "reward_min": 1.4800833733849361,
    "reward_std": 0.14764060131789747,
    "timesteps": 237783402,
    "learntime": 0.1816633779089898,
    "sampletime": 8.811385303968564,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 682,
    "reward_mean": 1.387283794845739,
    "reward_max": 2.1318340557402475,
    "reward_min": -7.203090656670008,
    "reward_std": 1.891456453015329,
    "timesteps": 238143087,
    "learntime": 0.18316954700276256,
    "sampletime": 8.852395790163428,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 683,
    "reward_mean": 0.849559786018425,
    "reward_max": 1.9896198733826351,
    "reward_min": -17.350101143578566,
    "reward_std": 3.214134605980074,
    "timesteps": 238501737,
    "learntime": 0.18026336911134422,
    "sampletime": 8.681327607948333,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 684,
    "reward_mean": 1.7252223625029646,
    "reward_max": 2.039779002915814,
    "reward_min": 1.245244729073923,
    "reward_std": 0.17767351907829979,
    "timesteps": 238862457,
    "learntime": 0.18128288420848548,
    "sampletime": 8.799840786959976,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 685,
    "reward_mean": 1.8158152956646718,
    "reward_max": 2.3363165392356935,
    "reward_min": 1.4563070623641523,
    "reward_std": 0.20020295374825292,
    "timesteps": 239223177,
    "learntime": 0.19028072711080313,
    "sampletime": 8.720595167018473,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 686,
    "reward_mean": 1.787263309301164,
    "reward_max": 2.2704711382058567,
    "reward_min": 1.4010475412660237,
    "reward_std": 0.15131952916717128,
    "timesteps": 239583897,
    "learntime": 0.18508673994801939,
    "sampletime": 8.760674493853003,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 687,
    "reward_mean": 1.8089958384524039,
    "reward_max": 2.1264137879215075,
    "reward_min": 1.4690802392821432,
    "reward_std": 0.15286082050863412,
    "timesteps": 239944617,
    "learntime": 0.1875828979536891,
    "sampletime": 8.643419033149257,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 688,
    "reward_mean": 1.8273978653923808,
    "reward_max": 2.270299703226752,
    "reward_min": 1.4770792789883336,
    "reward_std": 0.18131336738503667,
    "timesteps": 240305337,
    "learntime": 0.18477680790238082,
    "sampletime": 8.683708735043183,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 689,
    "reward_mean": 1.7733653809887877,
    "reward_max": 2.219091567182629,
    "reward_min": 1.0515744249384023,
    "reward_std": 0.2088693170640365,
    "timesteps": 240666057,
    "learntime": 0.1914639608003199,
    "sampletime": 8.659478161949664,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 690,
    "reward_mean": 1.8070349838908695,
    "reward_max": 2.1535406114734603,
    "reward_min": 1.4658920178225123,
    "reward_std": 0.15595220128378448,
    "timesteps": 241026777,
    "learntime": 0.1869032639078796,
    "sampletime": 8.824209508951753,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 691,
    "reward_mean": 1.2953323795547902,
    "reward_max": 2.0765790625080207,
    "reward_min": -7.372890829253294,
    "reward_std": 1.893922175244105,
    "timesteps": 241386291,
    "learntime": 0.18849780899472535,
    "sampletime": 8.70446231495589,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 692,
    "reward_mean": 1.7458994242329835,
    "reward_max": 2.123794507094619,
    "reward_min": 1.3572863563643585,
    "reward_std": 0.1497332736003635,
    "timesteps": 241747011,
    "learntime": 0.1828792050946504,
    "sampletime": 8.646119283977896,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 693,
    "reward_mean": 1.8494403768989298,
    "reward_max": 2.219848836466551,
    "reward_min": 1.461120582032227,
    "reward_std": 0.1544109232646162,
    "timesteps": 242107731,
    "learntime": 0.19034361583180726,
    "sampletime": 8.750546423019841,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 694,
    "reward_mean": 1.8758956409230627,
    "reward_max": 2.178296658191051,
    "reward_min": 1.4400628727223965,
    "reward_std": 0.15426429994139387,
    "timesteps": 242468451,
    "learntime": 0.18660103809088469,
    "sampletime": 8.753554024035111,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 695,
    "reward_mean": 1.8087125418947512,
    "reward_max": 2.1927885716766875,
    "reward_min": 1.4541865798307803,
    "reward_std": 0.14197460704975692,
    "timesteps": 242829171,
    "learntime": 0.19336515408940613,
    "sampletime": 8.628686501877382,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 696,
    "reward_mean": 1.7777398482957143,
    "reward_max": 2.101101664398534,
    "reward_min": 1.502243950560856,
    "reward_std": 0.12309592303025571,
    "timesteps": 243189891,
    "learntime": 0.18827971909195185,
    "sampletime": 8.74166627600789,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 697,
    "reward_mean": 0.9666236413420219,
    "reward_max": 2.273940701891354,
    "reward_min": -16.20327052771013,
    "reward_std": 3.039562457472764,
    "timesteps": 243548217,
    "learntime": 0.19396169390529394,
    "sampletime": 8.618676929967478,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 698,
    "reward_mean": 1.858519101867301,
    "reward_max": 2.1978487161298563,
    "reward_min": 1.5279074122167466,
    "reward_std": 0.15846031114856052,
    "timesteps": 243908937,
    "learntime": 0.19848636304959655,
    "sampletime": 8.738216819008812,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 699,
    "reward_mean": 1.7863416524418307,
    "reward_max": 2.1581717584631392,
    "reward_min": 1.3858157820520998,
    "reward_std": 0.13854233636184696,
    "timesteps": 244269657,
    "learntime": 0.18537809886038303,
    "sampletime": 8.796653619036078,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 700,
    "reward_mean": 1.399023358528243,
    "reward_max": 2.1893602477741094,
    "reward_min": -7.031748287855987,
    "reward_std": 1.8540365117582156,
    "timesteps": 244629393,
    "learntime": 0.19185870490036905,
    "sampletime": 8.77163538406603,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 701,
    "reward_mean": 1.771515385238239,
    "reward_max": 2.0206674746675115,
    "reward_min": 1.4192504823158443,
    "reward_std": 0.12360484956911753,
    "timesteps": 244990113,
    "learntime": 0.18044024286791682,
    "sampletime": 8.608342899940908,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 702,
    "reward_mean": 1.7040489925762528,
    "reward_max": 2.0197517045801785,
    "reward_min": 1.3637365295311812,
    "reward_std": 0.13983055779668607,
    "timesteps": 245350833,
    "learntime": 0.18170076399110258,
    "sampletime": 8.666512347059324,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 703,
    "reward_mean": 0.535158548914239,
    "reward_max": 2.151168301898803,
    "reward_min": -7.313885987937367,
    "reward_std": 3.078599876558556,
    "timesteps": 245708979,
    "learntime": 0.17925230297259986,
    "sampletime": 8.714828375028446,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 704,
    "reward_mean": 1.7955023585137717,
    "reward_max": 2.0795641141153394,
    "reward_min": 1.4551351120203908,
    "reward_std": 0.14340375785014614,
    "timesteps": 246069699,
    "learntime": 0.19356936891563237,
    "sampletime": 8.947020082967356,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 705,
    "reward_mean": 1.4025193146439818,
    "reward_max": 2.2737634000897544,
    "reward_min": -7.083007307659667,
    "reward_std": 1.822264900899247,
    "timesteps": 246429507,
    "learntime": 0.18259769794531167,
    "sampletime": 8.70879655284807,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 706,
    "reward_mean": 1.0393602489686855,
    "reward_max": 2.1773879824241784,
    "reward_min": -7.079189962319412,
    "reward_std": 2.530197895044705,
    "timesteps": 246788403,
    "learntime": 0.23187893093563616,
    "sampletime": 8.672114006010816,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 707,
    "reward_mean": 1.4014180475921374,
    "reward_max": 2.2609977217260586,
    "reward_min": -6.964641280532255,
    "reward_std": 1.8563502128908296,
    "timesteps": 247148211,
    "learntime": 0.2365561481565237,
    "sampletime": 8.678828086005524,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 708,
    "reward_mean": 1.7830447097969717,
    "reward_max": 2.168434517621238,
    "reward_min": 1.4137348823246068,
    "reward_std": 0.16939157273225652,
    "timesteps": 247508931,
    "learntime": 0.18818137794733047,
    "sampletime": 8.800283003831282,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 709,
    "reward_mean": 1.7819531456796018,
    "reward_max": 2.0894084697744484,
    "reward_min": 1.46781491592992,
    "reward_std": 0.1414362741478087,
    "timesteps": 247869651,
    "learntime": 0.20111175696365535,
    "sampletime": 8.716364518040791,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 710,
    "reward_mean": 1.8201146912356614,
    "reward_max": 2.1293148701196025,
    "reward_min": 1.3301034273692578,
    "reward_std": 0.14721773325573956,
    "timesteps": 248230371,
    "learntime": 0.2340383769478649,
    "sampletime": 8.767360980855301,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 711,
    "reward_mean": 1.79430936153893,
    "reward_max": 2.1513222700097776,
    "reward_min": 1.4350789765966383,
    "reward_std": 0.15183444591344994,
    "timesteps": 248591091,
    "learntime": 0.17792883585207164,
    "sampletime": 8.912564833881333,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 712,
    "reward_mean": 1.7832569543348016,
    "reward_max": 2.0819561033259184,
    "reward_min": 1.41325450548902,
    "reward_std": 0.1400416342329905,
    "timesteps": 248951811,
    "learntime": 0.22694882680661976,
    "sampletime": 8.614341703010723,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 713,
    "reward_mean": 1.8374434417578356,
    "reward_max": 2.2872313705341734,
    "reward_min": 1.460523837094011,
    "reward_std": 0.17053938787032982,
    "timesteps": 249312531,
    "learntime": 0.20314749097451568,
    "sampletime": 8.762497975956649,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 714,
    "reward_mean": 1.884165025548116,
    "reward_max": 2.1528286382478314,
    "reward_min": 1.553016115715513,
    "reward_std": 0.15032503994015292,
    "timesteps": 249673251,
    "learntime": 0.1883446159772575,
    "sampletime": 8.723663025069982,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 715,
    "reward_mean": 1.822402454527064,
    "reward_max": 2.0870982303185297,
    "reward_min": 1.3881453490255125,
    "reward_std": 0.156828307028513,
    "timesteps": 250033971,
    "learntime": 0.2389968279749155,
    "sampletime": 8.636903326958418,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 716,
    "reward_mean": 1.8075355574225624,
    "reward_max": 2.232841151688867,
    "reward_min": 1.4381964886807956,
    "reward_std": 0.17809562207299176,
    "timesteps": 250394691,
    "learntime": 0.19149553100578487,
    "sampletime": 8.72704717097804,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 717,
    "reward_mean": 1.746784219197785,
    "reward_max": 2.0986085770568788,
    "reward_min": 1.3091973119069598,
    "reward_std": 0.16488969570568277,
    "timesteps": 250755411,
    "learntime": 0.18122294801287353,
    "sampletime": 8.648832235019654,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 718,
    "reward_mean": 1.500027724103201,
    "reward_max": 2.224722748363595,
    "reward_min": -15.997790768913658,
    "reward_std": 2.4775888306443545,
    "timesteps": 251114985,
    "learntime": 0.23783061001449823,
    "sampletime": 8.777768970932811,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 719,
    "reward_mean": 1.850480251814766,
    "reward_max": 2.3526058170739805,
    "reward_min": 1.5118426583040565,
    "reward_std": 0.16900572847013404,
    "timesteps": 251475705,
    "learntime": 0.1905228509567678,
    "sampletime": 8.785217356868088,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 720,
    "reward_mean": 1.800928165511559,
    "reward_max": 2.2996613493676024,
    "reward_min": 1.3658648602361065,
    "reward_std": 0.14910459523671346,
    "timesteps": 251836425,
    "learntime": 0.22655609296634793,
    "sampletime": 8.768391010118648,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 721,
    "reward_mean": 1.791851822008315,
    "reward_max": 2.1460368805564887,
    "reward_min": 1.3325748243627846,
    "reward_std": 0.15766992877411676,
    "timesteps": 252197145,
    "learntime": 0.1834728908725083,
    "sampletime": 8.969644504832104,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 722,
    "reward_mean": 1.4772003553547535,
    "reward_max": 2.1768822296536627,
    "reward_min": -6.970600068315187,
    "reward_std": 1.7656072870185362,
    "timesteps": 252556908,
    "learntime": 0.23771712183952332,
    "sampletime": 8.639897315064445,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 723,
    "reward_mean": 1.7858953534916504,
    "reward_max": 2.0281881861543853,
    "reward_min": 1.4911409644656928,
    "reward_std": 0.13068105006664044,
    "timesteps": 252917628,
    "learntime": 0.18504987005144358,
    "sampletime": 8.66623644484207,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 724,
    "reward_mean": 1.7675197647452696,
    "reward_max": 2.1103638777911455,
    "reward_min": 1.4636280247537359,
    "reward_std": 0.12524878061376735,
    "timesteps": 253278348,
    "learntime": 0.237250748090446,
    "sampletime": 8.7118739138823,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 725,
    "reward_mean": 1.7494325924010445,
    "reward_max": 2.0985588423456187,
    "reward_min": 1.3878939206479097,
    "reward_std": 0.13619463025584969,
    "timesteps": 253639068,
    "learntime": 0.1813117628917098,
    "sampletime": 8.74661968788132,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 726,
    "reward_mean": 1.7975196676941891,
    "reward_max": 2.277821014894772,
    "reward_min": 1.5074238013158625,
    "reward_std": 0.191501408783266,
    "timesteps": 253999788,
    "learntime": 0.2330760839395225,
    "sampletime": 8.716542503098026,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 727,
    "reward_mean": 1.7931129489436344,
    "reward_max": 2.0935116345115765,
    "reward_min": 1.4047278925268463,
    "reward_std": 0.172016202130454,
    "timesteps": 254360508,
    "learntime": 0.19307644199579954,
    "sampletime": 8.80278675397858,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 728,
    "reward_mean": 1.7451595736172572,
    "reward_max": 2.0485583571805317,
    "reward_min": 1.4192711348419584,
    "reward_std": 0.14633841784202278,
    "timesteps": 254721228,
    "learntime": 0.23281325190328062,
    "sampletime": 8.75544441700913,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 729,
    "reward_mean": 1.7943673649348992,
    "reward_max": 2.1244307021014586,
    "reward_min": 1.3472543346535064,
    "reward_std": 0.16340185616329958,
    "timesteps": 255081948,
    "learntime": 0.185307830106467,
    "sampletime": 8.756731281988323,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 730,
    "reward_mean": 1.7812684237980148,
    "reward_max": 2.0260777156570713,
    "reward_min": 1.4989325057337695,
    "reward_std": 0.1320118694664345,
    "timesteps": 255442668,
    "learntime": 0.23807271313853562,
    "sampletime": 8.738574323942885,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 731,
    "reward_mean": 1.752328532131683,
    "reward_max": 2.0881091998501975,
    "reward_min": 1.3807917707740789,
    "reward_std": 0.12450483859090915,
    "timesteps": 255803388,
    "learntime": 0.19127996684983373,
    "sampletime": 8.735220697941259,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 732,
    "reward_mean": 1.7731047772129778,
    "reward_max": 2.174775776899903,
    "reward_min": 1.421283421698411,
    "reward_std": 0.16621673142032228,
    "timesteps": 256164108,
    "learntime": 0.2501368410885334,
    "sampletime": 8.760984196094796,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 733,
    "reward_mean": 1.8245912324185325,
    "reward_max": 2.2103007802048293,
    "reward_min": 1.4933309736097138,
    "reward_std": 0.13794023828336704,
    "timesteps": 256524828,
    "learntime": 0.18872856814414263,
    "sampletime": 8.780392061918974,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 734,
    "reward_mean": 1.8101470186660267,
    "reward_max": 2.1653490400860744,
    "reward_min": 1.415436883806248,
    "reward_std": 0.14687150862538745,
    "timesteps": 256885548,
    "learntime": 0.23968562111258507,
    "sampletime": 8.79976466903463,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 735,
    "reward_mean": 1.4147439531134536,
    "reward_max": 2.257178343767815,
    "reward_min": -7.069527821774089,
    "reward_std": 1.830403419714242,
    "timesteps": 257245143,
    "learntime": 0.18559592589735985,
    "sampletime": 8.716026451205835,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 736,
    "reward_mean": 1.8686812396226675,
    "reward_max": 2.1223333254350654,
    "reward_min": 1.5282478143604772,
    "reward_std": 0.13594772422611168,
    "timesteps": 257605863,
    "learntime": 0.24718065094202757,
    "sampletime": 8.701622165041044,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 737,
    "reward_mean": 1.7813568299830882,
    "reward_max": 2.081491816825952,
    "reward_min": 1.4472881725382498,
    "reward_std": 0.14374393829432525,
    "timesteps": 257966583,
    "learntime": 0.18744537397287786,
    "sampletime": 8.672401953022927,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 738,
    "reward_mean": 1.8055610930403145,
    "reward_max": 2.1492708726842498,
    "reward_min": 1.4623308727362494,
    "reward_std": 0.13856953497334681,
    "timesteps": 258327303,
    "learntime": 0.2504887110553682,
    "sampletime": 8.688284915173426,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 739,
    "reward_mean": 0.09481195226828334,
    "reward_max": 2.0060558500064682,
    "reward_min": -16.47184263632605,
    "reward_std": 4.141508051236038,
    "timesteps": 258684102,
    "learntime": 0.198848987929523,
    "sampletime": 8.837392023997381,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 740,
    "reward_mean": 1.8523830723163506,
    "reward_max": 2.1612355186124166,
    "reward_min": 1.5844317711889717,
    "reward_std": 0.1551508332906066,
    "timesteps": 259044822,
    "learntime": 0.20006558508612216,
    "sampletime": 8.72379324096255,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 741,
    "reward_mean": 1.4042260362328416,
    "reward_max": 2.2122406873774394,
    "reward_min": -7.577045130494025,
    "reward_std": 1.9185606168506624,
    "timesteps": 259404588,
    "learntime": 0.19222938898019493,
    "sampletime": 8.638037002179772,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 742,
    "reward_mean": 1.8402643407704602,
    "reward_max": 2.2349909984817087,
    "reward_min": 1.475789473630189,
    "reward_std": 0.15127743262974944,
    "timesteps": 259765308,
    "learntime": 0.18447562609799206,
    "sampletime": 8.71271746000275,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 743,
    "reward_mean": 1.8109386023167158,
    "reward_max": 2.139774887516977,
    "reward_min": 1.457654237179227,
    "reward_std": 0.1501083994440284,
    "timesteps": 260126028,
    "learntime": 0.193423958029598,
    "sampletime": 8.680953403003514,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 744,
    "reward_mean": 1.8508589412898835,
    "reward_max": 2.2379856255605692,
    "reward_min": 1.5435503957172207,
    "reward_std": 0.16252672185315978,
    "timesteps": 260486748,
    "learntime": 0.18702052091248333,
    "sampletime": 8.827476911945269,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 745,
    "reward_mean": 1.8152396387635192,
    "reward_max": 2.2455340947490168,
    "reward_min": 1.5092922822663999,
    "reward_std": 0.16713575236766637,
    "timesteps": 260847468,
    "learntime": 0.19127960898913443,
    "sampletime": 8.778334158007056,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 746,
    "reward_mean": 1.7906263265708116,
    "reward_max": 2.162339676100984,
    "reward_min": 1.5126171433067694,
    "reward_std": 0.14095130310472806,
    "timesteps": 261208188,
    "learntime": 0.18744163680821657,
    "sampletime": 8.736300272867084,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 747,
    "reward_mean": 1.7801434463704215,
    "reward_max": 2.0748810815509353,
    "reward_min": 1.4701866065839886,
    "reward_std": 0.13401041479426562,
    "timesteps": 261568908,
    "learntime": 0.1873407601378858,
    "sampletime": 8.817288069985807,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 748,
    "reward_mean": 1.8075529866343314,
    "reward_max": 2.0991623931666683,
    "reward_min": 1.4435287684170877,
    "reward_std": 0.154376890119446,
    "timesteps": 261929628,
    "learntime": 0.18928207806311548,
    "sampletime": 8.827175816055387,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 749,
    "reward_mean": 1.7843192604366487,
    "reward_max": 2.147984684332075,
    "reward_min": 1.4149560878885832,
    "reward_std": 0.17472928415140287,
    "timesteps": 262290348,
    "learntime": 0.19241161714307964,
    "sampletime": 8.908903620904312,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 750,
    "reward_mean": 1.4871691634158795,
    "reward_max": 2.3301212815550207,
    "reward_min": -6.755905707382641,
    "reward_std": 1.785308849697127,
    "timesteps": 262649889,
    "learntime": 0.19529846985824406,
    "sampletime": 8.715324097080156,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 751,
    "reward_mean": 1.8654202134261992,
    "reward_max": 2.3666223244799736,
    "reward_min": 1.5353402441998873,
    "reward_std": 0.1783998085144636,
    "timesteps": 263010609,
    "learntime": 0.18628913792781532,
    "sampletime": 8.740324896993116,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 752,
    "reward_mean": 1.8494623071234264,
    "reward_max": 2.2887216643906507,
    "reward_min": 1.4722624512558609,
    "reward_std": 0.18061515497879804,
    "timesteps": 263371329,
    "learntime": 0.19681593612767756,
    "sampletime": 8.810442208079621,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 753,
    "reward_mean": 1.8013902787797451,
    "reward_max": 2.141950480814557,
    "reward_min": 1.5013880106041924,
    "reward_std": 0.14050959791012232,
    "timesteps": 263732049,
    "learntime": 0.19248999608680606,
    "sampletime": 8.825761791085824,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 754,
    "reward_mean": 1.8550426416328851,
    "reward_max": 2.198725816269868,
    "reward_min": 1.3903831087708076,
    "reward_std": 0.16752734310343642,
    "timesteps": 264092769,
    "learntime": 0.199873732868582,
    "sampletime": 8.845257854089141,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 755,
    "reward_mean": 1.8155042925690785,
    "reward_max": 2.2395507922162836,
    "reward_min": 1.4204739850564758,
    "reward_std": 0.19003283554652856,
    "timesteps": 264453489,
    "learntime": 0.19694502488709986,
    "sampletime": 8.867932062828913,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 756,
    "reward_mean": 1.869515554038307,
    "reward_max": 2.4488597961502445,
    "reward_min": 1.1353096956754032,
    "reward_std": 0.19319267342464422,
    "timesteps": 264814209,
    "learntime": 0.190529023995623,
    "sampletime": 8.862856839084998,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 757,
    "reward_mean": 1.8478006299409713,
    "reward_max": 2.2283464984917134,
    "reward_min": 1.3696860952980119,
    "reward_std": 0.1807814323494912,
    "timesteps": 265174929,
    "learntime": 0.1895629509817809,
    "sampletime": 8.806547624059021,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 758,
    "reward_mean": 1.910279878244748,
    "reward_max": 2.4670077915620294,
    "reward_min": 1.388310074407577,
    "reward_std": 0.20285271449242098,
    "timesteps": 265535649,
    "learntime": 0.19130714912898839,
    "sampletime": 8.685782874934375,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 759,
    "reward_mean": 1.8449593106046318,
    "reward_max": 2.1262322684862833,
    "reward_min": 1.5244437101236188,
    "reward_std": 0.134221174003158,
    "timesteps": 265896369,
    "learntime": 0.1905136329587549,
    "sampletime": 8.747005727840587,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 760,
    "reward_mean": 1.808692952986564,
    "reward_max": 2.2996488464713982,
    "reward_min": 1.5040399770527542,
    "reward_std": 0.1457494823434223,
    "timesteps": 266257089,
    "learntime": 0.18031078903004527,
    "sampletime": 8.745092189870775,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 761,
    "reward_mean": 1.8677890191935687,
    "reward_max": 2.2756342115303987,
    "reward_min": 1.5029332491456309,
    "reward_std": 0.14977980881032452,
    "timesteps": 266617809,
    "learntime": 0.1894029409158975,
    "sampletime": 8.707425359170884,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 762,
    "reward_mean": 1.8408963505588756,
    "reward_max": 2.3517678198863208,
    "reward_min": 1.427206427713494,
    "reward_std": 0.16143344550511735,
    "timesteps": 266978529,
    "learntime": 0.1955885379575193,
    "sampletime": 8.692176630022004,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 763,
    "reward_mean": 1.8458462626520165,
    "reward_max": 2.416668568763158,
    "reward_min": 1.5303943965065423,
    "reward_std": 0.16217689729030646,
    "timesteps": 267339249,
    "learntime": 0.19900938286446035,
    "sampletime": 8.569480035919696,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 764,
    "reward_mean": 1.3834302992147438,
    "reward_max": 2.121340423145956,
    "reward_min": -7.043169145317129,
    "reward_std": 1.868116225537776,
    "timesteps": 267698787,
    "learntime": 0.19210844789631665,
    "sampletime": 8.914923397125676,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 765,
    "reward_mean": 1.073088626126967,
    "reward_max": 2.1780705470873993,
    "reward_min": -7.138221757147803,
    "reward_std": 2.5039324078396623,
    "timesteps": 268057143,
    "learntime": 0.19981611310504377,
    "sampletime": 8.602651074994355,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 766,
    "reward_mean": 1.4318125443349192,
    "reward_max": 2.1068089693807317,
    "reward_min": -6.956513111987575,
    "reward_std": 1.7624234476460898,
    "timesteps": 268416681,
    "learntime": 0.1889438619837165,
    "sampletime": 8.81121582700871,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 767,
    "reward_mean": 1.835661624132051,
    "reward_max": 2.1962117651362645,
    "reward_min": 1.5192077040855723,
    "reward_std": 0.13857401528367141,
    "timesteps": 268777401,
    "learntime": 0.20090711512602866,
    "sampletime": 8.802576340036467,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 768,
    "reward_mean": 1.8614759752988554,
    "reward_max": 2.2590709826520934,
    "reward_min": 1.5787947712832975,
    "reward_std": 0.1278029410479298,
    "timesteps": 269138121,
    "learntime": 0.186114622047171,
    "sampletime": 8.717590817948803,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 769,
    "reward_mean": 1.0724970072661217,
    "reward_max": 2.201427088819344,
    "reward_min": -7.589342966640481,
    "reward_std": 2.538997335123792,
    "timesteps": 269496417,
    "learntime": 0.18787587294355035,
    "sampletime": 8.750907161971554,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 770,
    "reward_mean": 1.3492188095205064,
    "reward_max": 1.9823063791140363,
    "reward_min": -7.378927317490295,
    "reward_std": 1.9264865879092778,
    "timesteps": 269855925,
    "learntime": 0.19942404702305794,
    "sampletime": 8.694587197853252,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 771,
    "reward_mean": 1.709374613462995,
    "reward_max": 2.173808381384744,
    "reward_min": 1.213996318515536,
    "reward_std": 0.1733011903679378,
    "timesteps": 270216645,
    "learntime": 0.1859276790637523,
    "sampletime": 8.954835630953312,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 772,
    "reward_mean": 1.8066692074513124,
    "reward_max": 2.16113178060517,
    "reward_min": 1.4218008022920279,
    "reward_std": 0.19004563683435308,
    "timesteps": 270577365,
    "learntime": 0.1952003911137581,
    "sampletime": 8.740540732163936,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 773,
    "reward_mean": 1.7848282187422293,
    "reward_max": 2.167672181866663,
    "reward_min": 1.4739673479237916,
    "reward_std": 0.14073129109092544,
    "timesteps": 270938085,
    "learntime": 0.18352594296447933,
    "sampletime": 8.767047885106876,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 774,
    "reward_mean": 1.8462147858158102,
    "reward_max": 2.355084039797979,
    "reward_min": 1.5332335821268233,
    "reward_std": 0.15470847759581458,
    "timesteps": 271298805,
    "learntime": 0.193001447012648,
    "sampletime": 8.730376346968114,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 775,
    "reward_mean": 1.8167008260644824,
    "reward_max": 2.278953681290711,
    "reward_min": 1.3359069081524242,
    "reward_std": 0.18534459317541158,
    "timesteps": 271659525,
    "learntime": 0.19089286914095283,
    "sampletime": 8.819314254913479,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 776,
    "reward_mean": 1.7349004000974575,
    "reward_max": 2.10540276085499,
    "reward_min": 1.3019675685720722,
    "reward_std": 0.16636965701609036,
    "timesteps": 272020245,
    "learntime": 0.1863904967904091,
    "sampletime": 8.778047024970874,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 777,
    "reward_mean": 1.788121848363975,
    "reward_max": 2.1381858119716366,
    "reward_min": 1.434929109885792,
    "reward_std": 0.1411266900275324,
    "timesteps": 272380965,
    "learntime": 0.24210810102522373,
    "sampletime": 8.66674921195954,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 778,
    "reward_mean": 1.8868665367273074,
    "reward_max": 2.2575102571369774,
    "reward_min": 1.4044693206705012,
    "reward_std": 0.19389797919631963,
    "timesteps": 272741685,
    "learntime": 0.24685148987919092,
    "sampletime": 8.972486859885976,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 779,
    "reward_mean": 1.833970855764856,
    "reward_max": 2.149315343620288,
    "reward_min": 1.3775520677057382,
    "reward_std": 0.1480539531387859,
    "timesteps": 273102405,
    "learntime": 0.1878347850870341,
    "sampletime": 8.759089770028368,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 780,
    "reward_mean": 1.39548294018315,
    "reward_max": 2.1631847133200264,
    "reward_min": -7.236286300273303,
    "reward_std": 1.9112045990343742,
    "timesteps": 273461931,
    "learntime": 0.18532626586966217,
    "sampletime": 8.690477455034852,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 781,
    "reward_mean": 1.8414753790760106,
    "reward_max": 2.2536279148215783,
    "reward_min": 1.3236128952086053,
    "reward_std": 0.17660861287302146,
    "timesteps": 273822651,
    "learntime": 0.23353597312234342,
    "sampletime": 8.546418624930084,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 782,
    "reward_mean": 1.7606881786009412,
    "reward_max": 2.2657281019862454,
    "reward_min": 1.3544963448040293,
    "reward_std": 0.1605661262230312,
    "timesteps": 274183371,
    "learntime": 0.19970629084855318,
    "sampletime": 8.603018019814044,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 783,
    "reward_mean": 1.771538925440344,
    "reward_max": 2.238269633528857,
    "reward_min": 1.4834018589301372,
    "reward_std": 0.14985780993068365,
    "timesteps": 274544091,
    "learntime": 0.2495201739948243,
    "sampletime": 8.733657406875864,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 784,
    "reward_mean": 1.7824357669664257,
    "reward_max": 2.0670979444952904,
    "reward_min": 1.4298128969782142,
    "reward_std": 0.1400421461137658,
    "timesteps": 274904811,
    "learntime": 0.19126415299251676,
    "sampletime": 8.83139230706729,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 785,
    "reward_mean": 1.7795200278788672,
    "reward_max": 2.109407879877833,
    "reward_min": 1.5282231576517589,
    "reward_std": 0.12248547391910872,
    "timesteps": 275265531,
    "learntime": 0.2519438681192696,
    "sampletime": 8.747572256950662,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 786,
    "reward_mean": 1.3617935407751558,
    "reward_max": 2.074517120621343,
    "reward_min": -7.598069639728322,
    "reward_std": 1.905267427083317,
    "timesteps": 275625051,
    "learntime": 0.19167363410815597,
    "sampletime": 8.652053694007918,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 787,
    "reward_mean": 1.7685706333839675,
    "reward_max": 2.1942657954659235,
    "reward_min": 1.3067543010763585,
    "reward_std": 0.16972099780019653,
    "timesteps": 275985771,
    "learntime": 0.23310579801909626,
    "sampletime": 8.74652908113785,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 788,
    "reward_mean": 1.3232886531496932,
    "reward_max": 2.0639996302391697,
    "reward_min": -7.309635142234836,
    "reward_std": 1.856724504966042,
    "timesteps": 276345474,
    "learntime": 0.19056436396203935,
    "sampletime": 8.793707221979275,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 789,
    "reward_mean": 1.7855867280298277,
    "reward_max": 2.0967254835971554,
    "reward_min": 1.379171581686629,
    "reward_std": 0.1604080869068771,
    "timesteps": 276706194,
    "learntime": 0.23850320791825652,
    "sampletime": 8.8018505750224,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 790,
    "reward_mean": 1.8210613823888013,
    "reward_max": 2.2142463345627394,
    "reward_min": 1.3349846958951765,
    "reward_std": 0.16161123991786253,
    "timesteps": 277066914,
    "learntime": 0.19644965790212154,
    "sampletime": 8.790068490197882,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 791,
    "reward_mean": 1.8015669868220376,
    "reward_max": 2.2473268703624565,
    "reward_min": 1.4577774130334655,
    "reward_std": 0.14899964914197453,
    "timesteps": 277427634,
    "learntime": 0.2383648599497974,
    "sampletime": 8.713655083905905,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 792,
    "reward_mean": 1.8100029231156176,
    "reward_max": 2.192390783088435,
    "reward_min": 1.4396004963412183,
    "reward_std": 0.1706896165207232,
    "timesteps": 277788354,
    "learntime": 0.1979579848702997,
    "sampletime": 8.706544467015192,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 793,
    "reward_mean": 1.831752060969884,
    "reward_max": 2.1505380360917585,
    "reward_min": 1.5662049476064335,
    "reward_std": 0.14145058405568844,
    "timesteps": 278149074,
    "learntime": 0.2398484000004828,
    "sampletime": 8.83226236095652,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 794,
    "reward_mean": 1.899184860320936,
    "reward_max": 2.3664009414161673,
    "reward_min": 1.5512800721035354,
    "reward_std": 0.15370543892032623,
    "timesteps": 278509794,
    "learntime": 0.18730040383525193,
    "sampletime": 8.688535845838487,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 795,
    "reward_mean": 1.863483504912038,
    "reward_max": 2.202073602933632,
    "reward_min": 1.5809492382845305,
    "reward_std": 0.14141623515557641,
    "timesteps": 278870514,
    "learntime": 0.24731635814532638,
    "sampletime": 8.722829316044226,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 796,
    "reward_mean": 1.8529622450054193,
    "reward_max": 2.2867508126558547,
    "reward_min": 0.9751279115549853,
    "reward_std": 0.21871265905401008,
    "timesteps": 279231234,
    "learntime": 0.18911184812895954,
    "sampletime": 8.82355128112249,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 797,
    "reward_mean": 1.859069527049,
    "reward_max": 2.2274321567189537,
    "reward_min": 1.4710981469975308,
    "reward_std": 0.1726345555824753,
    "timesteps": 279591954,
    "learntime": 0.24476019106805325,
    "sampletime": 9.00403959886171,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 798,
    "reward_mean": 1.3458123848939636,
    "reward_max": 2.0472351818138503,
    "reward_min": -7.383747998752039,
    "reward_std": 1.878340505411754,
    "timesteps": 279951741,
    "learntime": 0.19146438990719616,
    "sampletime": 8.647637755144387,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 799,
    "reward_mean": 1.8066893158977502,
    "reward_max": 2.2190863275027346,
    "reward_min": 1.4114467917631035,
    "reward_std": 0.16614152248662373,
    "timesteps": 280312461,
    "learntime": 0.25356606184504926,
    "sampletime": 8.730480283033103,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 800,
    "reward_mean": 1.7839790451087083,
    "reward_max": 2.143098263559458,
    "reward_min": 1.518609364053794,
    "reward_std": 0.13322871063783376,
    "timesteps": 280673181,
    "learntime": 0.1885525130201131,
    "sampletime": 8.726769310887903,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 801,
    "reward_mean": 1.86830462856766,
    "reward_max": 2.173796260674749,
    "reward_min": 1.4048177096475303,
    "reward_std": 0.1242828509918945,
    "timesteps": 281033901,
    "learntime": 0.16811312385834754,
    "sampletime": 8.62953370809555,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 802,
    "reward_mean": 1.8773191736002128,
    "reward_max": 2.2644409105731995,
    "reward_min": 1.6062263884144163,
    "reward_std": 0.16380687525441928,
    "timesteps": 281394621,
    "learntime": 0.1966182158794254,
    "sampletime": 8.679837990086526,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 803,
    "reward_mean": 1.8770654723786113,
    "reward_max": 2.2305943830135857,
    "reward_min": 1.5263787125815818,
    "reward_std": 0.14453457458659308,
    "timesteps": 281755341,
    "learntime": 0.19361774204298854,
    "sampletime": 8.727540082996711,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 804,
    "reward_mean": 1.8832286775065221,
    "reward_max": 2.299175754787733,
    "reward_min": 1.531252862150058,
    "reward_std": 0.1503479067948476,
    "timesteps": 282116061,
    "learntime": 0.1967414270620793,
    "sampletime": 8.89082229998894,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 805,
    "reward_mean": 1.8079685317517047,
    "reward_max": 2.136890511843374,
    "reward_min": 1.3711831552632636,
    "reward_std": 0.1622760998243632,
    "timesteps": 282476781,
    "learntime": 0.19457690394483507,
    "sampletime": 8.650080689927563,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 806,
    "reward_mean": 1.7529275008777252,
    "reward_max": 2.2333166963314066,
    "reward_min": 1.507179553810573,
    "reward_std": 0.1566241933527993,
    "timesteps": 282837501,
    "learntime": 0.19402274512685835,
    "sampletime": 8.776798016857356,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 807,
    "reward_mean": 1.7503795171219176,
    "reward_max": 2.0953996200177305,
    "reward_min": 1.3992485411775577,
    "reward_std": 0.147442999452358,
    "timesteps": 283198221,
    "learntime": 0.1954324629623443,
    "sampletime": 8.790237826062366,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 808,
    "reward_mean": 1.8446872700338586,
    "reward_max": 2.2278125770034287,
    "reward_min": 1.5886670444231228,
    "reward_std": 0.12361033718206213,
    "timesteps": 283558941,
    "learntime": 0.19487062888219953,
    "sampletime": 8.671616706997156,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 809,
    "reward_mean": 1.8304380809093794,
    "reward_max": 2.2810945642448814,
    "reward_min": 1.4706146374891302,
    "reward_std": 0.1611059571085629,
    "timesteps": 283919661,
    "learntime": 0.1888606131542474,
    "sampletime": 8.767599125858396,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 810,
    "reward_mean": 1.9011530312129483,
    "reward_max": 2.1925959084635673,
    "reward_min": 1.5968981599717396,
    "reward_std": 0.13497343678895773,
    "timesteps": 284280381,
    "learntime": 0.23421072214841843,
    "sampletime": 8.666762351989746,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 811,
    "reward_mean": 1.9056707289246195,
    "reward_max": 2.442248337516499,
    "reward_min": 1.3524375838883704,
    "reward_std": 0.18112831776470123,
    "timesteps": 284641101,
    "learntime": 0.19221029803156853,
    "sampletime": 8.66463715606369,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 812,
    "reward_mean": 1.8376975159179534,
    "reward_max": 2.2662419848563826,
    "reward_min": 1.5346235215141784,
    "reward_std": 0.17292215785399181,
    "timesteps": 285001821,
    "learntime": 0.19124127714894712,
    "sampletime": 8.770321113057435,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 813,
    "reward_mean": 1.8770950076782917,
    "reward_max": 2.2107272416914268,
    "reward_min": 1.4723880841029844,
    "reward_std": 0.16016010379005194,
    "timesteps": 285362541,
    "learntime": 0.19207593705505133,
    "sampletime": 8.794662079075351,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 814,
    "reward_mean": 1.358423656031226,
    "reward_max": 2.164449762623528,
    "reward_min": -7.600588938955107,
    "reward_std": 1.976568063673195,
    "timesteps": 285722055,
    "learntime": 0.19912517606280744,
    "sampletime": 8.817245783982798,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 815,
    "reward_mean": 1.7546938724187406,
    "reward_max": 2.1265429166978147,
    "reward_min": 1.4588633523506147,
    "reward_std": 0.15951373630512672,
    "timesteps": 286082775,
    "learntime": 0.19763334491290152,
    "sampletime": 8.543854546966031,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 816,
    "reward_mean": 1.7466338096092127,
    "reward_max": 2.1589309111150197,
    "reward_min": 1.417892628885577,
    "reward_std": 0.14763829113190333,
    "timesteps": 286443495,
    "learntime": 0.19740877603180707,
    "sampletime": 8.71816632617265,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 817,
    "reward_mean": 1.8007436968601156,
    "reward_max": 2.1048856949335315,
    "reward_min": 1.4498169761200446,
    "reward_std": 0.14859962979141905,
    "timesteps": 286804215,
    "learntime": 0.19012567796744406,
    "sampletime": 8.694907215191051,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 818,
    "reward_mean": 1.7844721172045765,
    "reward_max": 2.054738842689952,
    "reward_min": 1.4066225457724832,
    "reward_std": 0.14648237812133028,
    "timesteps": 287164935,
    "learntime": 0.19671846088021994,
    "sampletime": 8.746190485078841,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 819,
    "reward_mean": 1.8162420441046625,
    "reward_max": 2.231387689328667,
    "reward_min": 1.3070981617784112,
    "reward_std": 0.15840344339008963,
    "timesteps": 287525655,
    "learntime": 0.1906777259428054,
    "sampletime": 8.757564023835585,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 820,
    "reward_mean": 1.8341206594435342,
    "reward_max": 2.183090228915466,
    "reward_min": 1.4349286840579487,
    "reward_std": 0.1668667095039615,
    "timesteps": 287886375,
    "learntime": 0.19329903088510036,
    "sampletime": 8.678835779195651,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 821,
    "reward_mean": 1.8258299435465795,
    "reward_max": 2.346159630546797,
    "reward_min": 1.433452426526468,
    "reward_std": 0.17177528559630104,
    "timesteps": 288247095,
    "learntime": 0.1887785019353032,
    "sampletime": 8.669525802135468,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 822,
    "reward_mean": 1.7482032150493656,
    "reward_max": 2.2120529745465523,
    "reward_min": 1.3833899357193844,
    "reward_std": 0.19302644664598814,
    "timesteps": 288607815,
    "learntime": 0.18933133012615144,
    "sampletime": 8.764682967914268,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 823,
    "reward_mean": 1.8597118027410182,
    "reward_max": 2.224100208820092,
    "reward_min": 1.425020890208099,
    "reward_std": 0.1680975732547101,
    "timesteps": 288968535,
    "learntime": 0.18482616217806935,
    "sampletime": 8.626753716962412,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 824,
    "reward_mean": 1.9281205719505867,
    "reward_max": 2.3499879386032565,
    "reward_min": 1.590413496318633,
    "reward_std": 0.15744616168435785,
    "timesteps": 289329255,
    "learntime": 0.19519233889877796,
    "sampletime": 8.639774347189814,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 825,
    "reward_mean": 1.4513185712936973,
    "reward_max": 2.4114130908063887,
    "reward_min": -7.1218359281845185,
    "reward_std": 1.834514398885158,
    "timesteps": 289688793,
    "learntime": 0.193633281160146,
    "sampletime": 8.667388472007588,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 826,
    "reward_mean": 1.117229984313811,
    "reward_max": 2.415434958550823,
    "reward_min": -6.956839782376352,
    "reward_std": 2.3942427820108736,
    "timesteps": 290047077,
    "learntime": 0.2034239899367094,
    "sampletime": 8.50846641114913,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 827,
    "reward_mean": 1.4763664528995961,
    "reward_max": 2.3143025573162666,
    "reward_min": -7.3647282942463725,
    "reward_std": 1.884493361896236,
    "timesteps": 290406555,
    "learntime": 0.19644125807099044,
    "sampletime": 8.75161345792003,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 828,
    "reward_mean": 1.883690469622723,
    "reward_max": 2.299250167204361,
    "reward_min": 1.497428794854907,
    "reward_std": 0.16392535539256703,
    "timesteps": 290767275,
    "learntime": 0.2003311119042337,
    "sampletime": 8.66702992003411,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 829,
    "reward_mean": 1.9113142620391876,
    "reward_max": 2.230832334287696,
    "reward_min": 1.5362990247932324,
    "reward_std": 0.16165622150055955,
    "timesteps": 291127995,
    "learntime": 0.19765872391872108,
    "sampletime": 8.750797844026238,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 830,
    "reward_mean": 1.5112120245877279,
    "reward_max": 2.463058195040722,
    "reward_min": -7.3386538730670585,
    "reward_std": 1.8325152245709528,
    "timesteps": 291487464,
    "learntime": 0.1987560570705682,
    "sampletime": 8.747871820116416,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 831,
    "reward_mean": 1.8903958485903984,
    "reward_max": 2.2113309119013085,
    "reward_min": 1.5571309398598672,
    "reward_std": 0.15011910695769848,
    "timesteps": 291848184,
    "learntime": 0.1987416900228709,
    "sampletime": 8.842880787095055,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 832,
    "reward_mean": 1.9014652066607085,
    "reward_max": 2.2222725569551005,
    "reward_min": 1.4440642798453491,
    "reward_std": 0.15974459081730047,
    "timesteps": 292208904,
    "learntime": 0.19512432720512152,
    "sampletime": 8.792280454887077,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 833,
    "reward_mean": 2.0539534855557697,
    "reward_max": 2.432215278174471,
    "reward_min": 1.6227256019831662,
    "reward_std": 0.172115671430344,
    "timesteps": 292569624,
    "learntime": 0.1946146609261632,
    "sampletime": 8.70571930008009,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 834,
    "reward_mean": 1.6082466880112618,
    "reward_max": 2.393593534858981,
    "reward_min": -6.65628275559919,
    "reward_std": 1.8200630130111441,
    "timesteps": 292929237,
    "learntime": 0.19913846696726978,
    "sampletime": 8.797889602836221,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 835,
    "reward_mean": 1.9413099440061574,
    "reward_max": 2.4267959444656597,
    "reward_min": 1.5851982392769308,
    "reward_std": 0.1732331622047143,
    "timesteps": 293289957,
    "learntime": 0.1934306479524821,
    "sampletime": 8.764099622843787,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 836,
    "reward_mean": 2.0221874834581413,
    "reward_max": 2.481827982534823,
    "reward_min": 1.5670627226530895,
    "reward_std": 0.1741395902312345,
    "timesteps": 293650677,
    "learntime": 0.19306838908232749,
    "sampletime": 8.912699023960158,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 837,
    "reward_mean": 2.075699763406102,
    "reward_max": 2.467001890290923,
    "reward_min": 1.7139135115307182,
    "reward_std": 0.1656361748997196,
    "timesteps": 294011397,
    "learntime": 0.1961502069607377,
    "sampletime": 8.783927460899577,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 838,
    "reward_mean": 1.6053573118071673,
    "reward_max": 2.3483422074544533,
    "reward_min": -6.783800875725734,
    "reward_std": 1.77979005268026,
    "timesteps": 294371037,
    "learntime": 0.1876695011742413,
    "sampletime": 8.741293256171048,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 839,
    "reward_mean": 2.058871849499326,
    "reward_max": 2.5830753041399537,
    "reward_min": 1.693620354491884,
    "reward_std": 0.1948200089989624,
    "timesteps": 294731757,
    "learntime": 0.1976403370499611,
    "sampletime": 8.781365394126624,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 840,
    "reward_mean": 2.099525188525133,
    "reward_max": 2.473302725155721,
    "reward_min": 1.6885421179220872,
    "reward_std": 0.16975640964029004,
    "timesteps": 295092477,
    "learntime": 0.2095558368600905,
    "sampletime": 8.8232507458888,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 841,
    "reward_mean": 2.161063338618405,
    "reward_max": 2.500245796535055,
    "reward_min": 1.7743825542036715,
    "reward_std": 0.16524081117951717,
    "timesteps": 295453197,
    "learntime": 0.2013468591030687,
    "sampletime": 8.73386527900584,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 842,
    "reward_mean": 1.6421437512420969,
    "reward_max": 2.5130533543779148,
    "reward_min": -6.721549919413081,
    "reward_std": 1.7862085652021784,
    "timesteps": 295812744,
    "learntime": 0.19262715289369226,
    "sampletime": 8.709718113997951,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 843,
    "reward_mean": 1.7436608506797286,
    "reward_max": 2.7250198722450105,
    "reward_min": -6.843153235477849,
    "reward_std": 1.8513831928031677,
    "timesteps": 296172333,
    "learntime": 0.20560434693470597,
    "sampletime": 8.919373735785484,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 844,
    "reward_mean": 2.0712896209047558,
    "reward_max": 2.505011651776094,
    "reward_min": 1.5738401931170771,
    "reward_std": 0.18714050114726075,
    "timesteps": 296533053,
    "learntime": 0.20614025299437344,
    "sampletime": 8.731259824009612,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 845,
    "reward_mean": 0.4420963542186888,
    "reward_max": 2.656277758004656,
    "reward_min": -14.20844099986587,
    "reward_std": 3.6377840336073506,
    "timesteps": 296889069,
    "learntime": 0.1982455370016396,
    "sampletime": 8.773138461168855,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 846,
    "reward_mean": 1.7250031694963999,
    "reward_max": 2.588000792526693,
    "reward_min": -6.701930321195646,
    "reward_std": 1.8088248095808004,
    "timesteps": 297248526,
    "learntime": 0.20969210495240986,
    "sampletime": 8.684023156994954,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 847,
    "reward_mean": 1.3332077051663191,
    "reward_max": 2.614833053264932,
    "reward_min": -6.8166216361392875,
    "reward_std": 2.536935702897685,
    "timesteps": 297606972,
    "learntime": 0.19956684997305274,
    "sampletime": 8.676666063023731,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 848,
    "reward_mean": 0.8760961752126922,
    "reward_max": 2.638411948773862,
    "reward_min": -15.400294656641291,
    "reward_std": 3.4254093348054715,
    "timesteps": 297964233,
    "learntime": 0.19333415501751006,
    "sampletime": 8.709534686990082,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 849,
    "reward_mean": 0.609930362310963,
    "reward_max": 2.8464966895399155,
    "reward_min": -6.911531994951833,
    "reward_std": 3.403068783111828,
    "timesteps": 298320180,
    "learntime": 0.19409151701256633,
    "sampletime": 8.683735897066072,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 850,
    "reward_mean": 1.7907172017515698,
    "reward_max": 2.6280875099358965,
    "reward_min": -6.420993326385295,
    "reward_std": 1.7147493924118378,
    "timesteps": 298679688,
    "learntime": 0.20368334301747382,
    "sampletime": 8.749917356995866,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 851,
    "reward_mean": 0.8293640680080099,
    "reward_max": 2.3939241692287085,
    "reward_min": -15.974180284915775,
    "reward_std": 3.4562036461137273,
    "timesteps": 299037306,
    "learntime": 0.19858261407352984,
    "sampletime": 8.618518475908786,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 852,
    "reward_mean": 0.4743980631017777,
    "reward_max": 2.50615733728751,
    "reward_min": -13.91832605101728,
    "reward_std": 3.591540831997186,
    "timesteps": 299393511,
    "learntime": 0.19743476784788072,
    "sampletime": 8.673812285065651,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 853,
    "reward_mean": 1.3600632062812217,
    "reward_max": 2.5813185490442243,
    "reward_min": -6.75414747181772,
    "reward_std": 2.532982302265576,
    "timesteps": 299752341,
    "learntime": 0.19912743801251054,
    "sampletime": 8.842981760157272,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 854,
    "reward_mean": 0.43416817898796506,
    "reward_max": 2.5354521977962095,
    "reward_min": -14.272499361405304,
    "reward_std": 3.5892058433773824,
    "timesteps": 300108474,
    "learntime": 0.19442481687292457,
    "sampletime": 8.620944405905902,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 855,
    "reward_mean": -0.3452289169972088,
    "reward_max": 2.4463979606657738,
    "reward_min": -14.097769489889393,
    "reward_std": 4.135209625575024,
    "timesteps": 300462477,
    "learntime": 0.19671761197969317,
    "sampletime": 8.685833716997877,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 856,
    "reward_mean": 0.906344291818256,
    "reward_max": 2.4684097405821124,
    "reward_min": -15.539322549143854,
    "reward_std": 3.7295536355150074,
    "timesteps": 300820401,
    "learntime": 0.1961041809991002,
    "sampletime": 8.7113648399245,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 857,
    "reward_mean": 1.4534137039757788,
    "reward_max": 2.6210208107398967,
    "reward_min": -6.620240888762942,
    "reward_std": 2.399736277054886,
    "timesteps": 301178772,
    "learntime": 0.19509474490769207,
    "sampletime": 8.74763738294132,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 858,
    "reward_mean": 0.8701813226363749,
    "reward_max": 2.55625842752973,
    "reward_min": -7.256471992341565,
    "reward_std": 3.094832970603802,
    "timesteps": 301535889,
    "learntime": 0.19471609499305487,
    "sampletime": 8.638522850116715,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 859,
    "reward_mean": 1.6504385828064407,
    "reward_max": 2.5216105806256444,
    "reward_min": -6.926422433079238,
    "reward_std": 1.8626394800651982,
    "timesteps": 301895481,
    "learntime": 0.20896068890579045,
    "sampletime": 8.758062042063102,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 860,
    "reward_mean": 0.882797794799332,
    "reward_max": 2.611978237347845,
    "reward_min": -14.389257736727211,
    "reward_std": 3.348678279016589,
    "timesteps": 302253240,
    "learntime": 0.1974867491517216,
    "sampletime": 8.60716347093694,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 861,
    "reward_mean": 0.8695284155144858,
    "reward_max": 2.480150960541017,
    "reward_min": -15.32332404150282,
    "reward_std": 3.352888402710527,
    "timesteps": 302610660,
    "learntime": 0.1926091390196234,
    "sampletime": 8.639319923939183,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 862,
    "reward_mean": 0.9040167831515579,
    "reward_max": 2.4605848956540046,
    "reward_min": -6.758122408522691,
    "reward_std": 2.8953156830219213,
    "timesteps": 302967987,
    "learntime": 0.2006376979406923,
    "sampletime": 8.799011938972399,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 863,
    "reward_mean": 0.5300261619278434,
    "reward_max": 2.672355155671317,
    "reward_min": -15.539296968099238,
    "reward_std": 3.705655375361127,
    "timesteps": 303324078,
    "learntime": 0.19606792484410107,
    "sampletime": 8.594963792944327,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 864,
    "reward_mean": 1.2350794120187567,
    "reward_max": 2.4874469240121844,
    "reward_min": -7.109258984376072,
    "reward_std": 2.628222469548667,
    "timesteps": 303682272,
    "learntime": 0.20774714183062315,
    "sampletime": 8.770038006827235,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 865,
    "reward_mean": 1.6026022296112474,
    "reward_max": 2.3109644573894235,
    "reward_min": -6.816320686757648,
    "reward_std": 1.7870009161014953,
    "timesteps": 304041846,
    "learntime": 0.19841264095157385,
    "sampletime": 8.723268804140389,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 866,
    "reward_mean": 0.8326013861322914,
    "reward_max": 2.416496360154818,
    "reward_min": -7.257145586514418,
    "reward_std": 3.020678468649745,
    "timesteps": 304399008,
    "learntime": 0.2004627820570022,
    "sampletime": 8.711910007987171,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 867,
    "reward_mean": -0.14645771932697477,
    "reward_max": 2.297914377813205,
    "reward_min": -15.669267444509778,
    "reward_std": 4.515098883966518,
    "timesteps": 304754127,
    "learntime": 0.1972554379608482,
    "sampletime": 8.73498387215659,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 868,
    "reward_mean": 0.37974206505785835,
    "reward_max": 2.276291086543066,
    "reward_min": -6.806539848229897,
    "reward_std": 3.2982106797251847,
    "timesteps": 305110401,
    "learntime": 0.19378086202777922,
    "sampletime": 8.633379538077861,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 869,
    "reward_mean": 1.8910009280270712,
    "reward_max": 2.27711319873823,
    "reward_min": 1.490245589977622,
    "reward_std": 0.1755790050177676,
    "timesteps": 305471121,
    "learntime": 0.19563284097239375,
    "sampletime": 8.674979896983132,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 870,
    "reward_mean": 1.11146437048995,
    "reward_max": 2.4293414529899784,
    "reward_min": -6.9175709397779,
    "reward_std": 2.4983818636505193,
    "timesteps": 305829579,
    "learntime": 0.1991462088190019,
    "sampletime": 8.754812533035874,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 871,
    "reward_mean": 1.810661224035487,
    "reward_max": 2.1509326319774638,
    "reward_min": 1.2523892453084964,
    "reward_std": 0.18885048035008492,
    "timesteps": 306190299,
    "learntime": 0.19625492091290653,
    "sampletime": 8.870937661034986,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 872,
    "reward_mean": 1.0546806374589748,
    "reward_max": 2.212530157292458,
    "reward_min": -7.180692963767796,
    "reward_std": 2.5299104808416306,
    "timesteps": 306548889,
    "learntime": 0.19244834198616445,
    "sampletime": 8.66165099083446,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 873,
    "reward_mean": 1.5471024640876134,
    "reward_max": 2.382624694620695,
    "reward_min": -7.062398154393042,
    "reward_std": 1.8495877505417784,
    "timesteps": 306908475,
    "learntime": 0.19279742683283985,
    "sampletime": 8.676837276900187,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 874,
    "reward_mean": 1.5078702261743906,
    "reward_max": 2.3924398595448677,
    "reward_min": -7.260111661798985,
    "reward_std": 1.8078844855938738,
    "timesteps": 307267932,
    "learntime": 0.19776285393163562,
    "sampletime": 8.687877027085051,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 875,
    "reward_mean": 1.4568523845799524,
    "reward_max": 2.227306436473911,
    "reward_min": -7.297702891286465,
    "reward_std": 1.887403073927811,
    "timesteps": 307627587,
    "learntime": 0.2005846940446645,
    "sampletime": 8.722993026021868,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 876,
    "reward_mean": 1.4913787630760418,
    "reward_max": 2.319965445397729,
    "reward_min": -14.386652647370484,
    "reward_std": 2.3076362414571934,
    "timesteps": 307987059,
    "learntime": 0.19777466589584947,
    "sampletime": 8.721725370036438,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 877,
    "reward_mean": 1.460581928097632,
    "reward_max": 2.108391656843715,
    "reward_min": -6.308328171507232,
    "reward_std": 1.7068767880269506,
    "timesteps": 308346618,
    "learntime": 0.199804849922657,
    "sampletime": 8.738136587897316,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 878,
    "reward_mean": 1.3957040602804565,
    "reward_max": 2.1357247686039145,
    "reward_min": -7.063218507167858,
    "reward_std": 1.828208948321239,
    "timesteps": 308706168,
    "learntime": 0.2432427150197327,
    "sampletime": 8.761633632937446,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 879,
    "reward_mean": 1.3858774869620605,
    "reward_max": 2.11645152223663,
    "reward_min": -7.141499293562173,
    "reward_std": 1.8614105381586556,
    "timesteps": 309065736,
    "learntime": 0.24538471922278404,
    "sampletime": 8.720510831102729,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 880,
    "reward_mean": 1.7217599207417216,
    "reward_max": 2.060117844549633,
    "reward_min": 1.3158254536789469,
    "reward_std": 0.16762584293405858,
    "timesteps": 309426456,
    "learntime": 0.2070877489168197,
    "sampletime": 8.71114797797054,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 881,
    "reward_mean": 1.8599037029978946,
    "reward_max": 2.127654957355733,
    "reward_min": 1.5992660960111964,
    "reward_std": 0.13546786992117846,
    "timesteps": 309787176,
    "learntime": 0.20160660496912897,
    "sampletime": 8.835992133943364,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 882,
    "reward_mean": 1.7727908635024436,
    "reward_max": 2.116386685132358,
    "reward_min": 1.5194960856734325,
    "reward_std": 0.1412236686599556,
    "timesteps": 310147896,
    "learntime": 0.24499797308817506,
    "sampletime": 8.68529169401154,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 883,
    "reward_mean": 1.7600646096906454,
    "reward_max": 2.1424999224096086,
    "reward_min": 1.380037654240201,
    "reward_std": 0.16344875834951592,
    "timesteps": 310508616,
    "learntime": 0.20254032802768052,
    "sampletime": 8.72408901504241,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 884,
    "reward_mean": 1.7954969357897363,
    "reward_max": 2.1670845189188213,
    "reward_min": 1.4021742535035353,
    "reward_std": 0.1518926475650741,
    "timesteps": 310869336,
    "learntime": 0.24307782691903412,
    "sampletime": 8.713530336041003,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 885,
    "reward_mean": 1.7751210565670807,
    "reward_max": 2.0552119750557742,
    "reward_min": 1.441251939040022,
    "reward_std": 0.11818278191568728,
    "timesteps": 311230056,
    "learntime": 0.204085152130574,
    "sampletime": 8.797361247939989,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 886,
    "reward_mean": 1.494912201628548,
    "reward_max": 2.284627372948854,
    "reward_min": -7.065968682881887,
    "reward_std": 1.7738922287166563,
    "timesteps": 311589744,
    "learntime": 0.25783065613359213,
    "sampletime": 8.685400906950235,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 887,
    "reward_mean": 1.7707761897523944,
    "reward_max": 2.1003940026866696,
    "reward_min": 1.3347912791747734,
    "reward_std": 0.17890450812164618,
    "timesteps": 311950464,
    "learntime": 0.20001702196896076,
    "sampletime": 8.715551868081093,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 888,
    "reward_mean": 1.873245440594296,
    "reward_max": 2.2067037372180454,
    "reward_min": 1.6327084315214015,
    "reward_std": 0.13480469040154755,
    "timesteps": 312311184,
    "learntime": 0.25416371901519597,
    "sampletime": 8.780900809215382,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 889,
    "reward_mean": 1.8541960657899887,
    "reward_max": 2.097647182194507,
    "reward_min": 1.4884096005636898,
    "reward_std": 0.14017539099888285,
    "timesteps": 312671904,
    "learntime": 0.20146610401570797,
    "sampletime": 8.86832161503844,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 890,
    "reward_mean": 1.9028478207859558,
    "reward_max": 2.177001765296557,
    "reward_min": 1.5402455048760815,
    "reward_std": 0.13448820006077145,
    "timesteps": 313032624,
    "learntime": 0.25182573893107474,
    "sampletime": 8.8417814578861,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 891,
    "reward_mean": 1.8129558020972723,
    "reward_max": 2.247142902353184,
    "reward_min": 1.4068863724612353,
    "reward_std": 0.16012780806103105,
    "timesteps": 313393344,
    "learntime": 0.19245507987216115,
    "sampletime": 8.73743371386081,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 892,
    "reward_mean": 1.8878439111179042,
    "reward_max": 2.2064739368577233,
    "reward_min": 1.6202417536564573,
    "reward_std": 0.12821951270170007,
    "timesteps": 313754064,
    "learntime": 0.26015681703574955,
    "sampletime": 8.783879689872265,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 893,
    "reward_mean": -0.9253925301115015,
    "reward_max": 2.280452378362743,
    "reward_min": -56.831721688177716,
    "reward_std": 7.957965060816822,
    "timesteps": 314105685,
    "learntime": 0.20281767309643328,
    "sampletime": 8.593154269037768,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 894,
    "reward_mean": 1.4658563007351297,
    "reward_max": 2.2435508981227117,
    "reward_min": -7.655066891044213,
    "reward_std": 1.9786693603663843,
    "timesteps": 314465121,
    "learntime": 0.23626745911315084,
    "sampletime": 8.795195032842457,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 895,
    "reward_mean": 1.863021928678645,
    "reward_max": 2.318888994806911,
    "reward_min": 1.4215979442550697,
    "reward_std": 0.1730901324708495,
    "timesteps": 314825841,
    "learntime": 0.19313801196403801,
    "sampletime": 8.78106172895059,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 896,
    "reward_mean": 1.5639937289532808,
    "reward_max": 2.285754692077522,
    "reward_min": -6.525448764983595,
    "reward_std": 1.776766728252857,
    "timesteps": 315185226,
    "learntime": 0.2529242248274386,
    "sampletime": 8.88647967716679,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 897,
    "reward_mean": 1.1692865257500111,
    "reward_max": 2.27332290523389,
    "reward_min": -16.320014915806524,
    "reward_std": 3.070871620147353,
    "timesteps": 315543450,
    "learntime": 0.21127695287577808,
    "sampletime": 8.73049047589302,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 898,
    "reward_mean": 1.5430962975945826,
    "reward_max": 2.3161090923716623,
    "reward_min": -7.562922085748252,
    "reward_std": 1.9941556440393573,
    "timesteps": 315902865,
    "learntime": 0.22659365995787084,
    "sampletime": 8.800870294915512,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 899,
    "reward_mean": 1.8823631835892942,
    "reward_max": 2.2284670597556127,
    "reward_min": 1.1157955496896472,
    "reward_std": 0.20923515140251997,
    "timesteps": 316263585,
    "learntime": 0.20884928316809237,
    "sampletime": 8.736560896970332,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 900,
    "reward_mean": -0.5191038597549401,
    "reward_max": 2.2116967868668387,
    "reward_min": -44.07778995823306,
    "reward_std": 6.496385161662748,
    "timesteps": 316616733,
    "learntime": 0.24445278500206769,
    "sampletime": 8.691931131994352,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 901,
    "reward_mean": -0.2580671872856282,
    "reward_max": 2.2078615737356633,
    "reward_min": -43.75972524387092,
    "reward_std": 6.555402102867387,
    "timesteps": 316970952,
    "learntime": 0.20669135102070868,
    "sampletime": 8.72984891012311,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 902,
    "reward_mean": 1.5047976691206648,
    "reward_max": 2.1742600308657094,
    "reward_min": -7.296025348516005,
    "reward_std": 1.915349246746754,
    "timesteps": 317330349,
    "learntime": 0.2678094529546797,
    "sampletime": 8.802680401830003,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 903,
    "reward_mean": -1.5031934997543783,
    "reward_max": 2.318348745737844,
    "reward_min": -25.683617643933484,
    "reward_std": 6.353584687242934,
    "timesteps": 317680812,
    "learntime": 0.19649541121907532,
    "sampletime": 8.786847713869065,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 904,
    "reward_mean": -4.015042976851546,
    "reward_max": 2.2623273185560118,
    "reward_min": -44.372904056946886,
    "reward_std": 9.39742511094861,
    "timesteps": 318023415,
    "learntime": 0.24516320996917784,
    "sampletime": 8.396701063029468,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 905,
    "reward_mean": -1.4929028276860767,
    "reward_max": 2.1564008814307387,
    "reward_min": -72.46407372292103,
    "reward_std": 9.87810406792208,
    "timesteps": 318373584,
    "learntime": 0.2002893358003348,
    "sampletime": 8.512410979019478,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 906,
    "reward_mean": -1.9063962475030407,
    "reward_max": 2.2443087559870682,
    "reward_min": -44.216999720366665,
    "reward_std": 7.719156407285215,
    "timesteps": 318722589,
    "learntime": 0.22444374486804008,
    "sampletime": 8.489913010969758,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 907,
    "reward_mean": 1.8994953739708127,
    "reward_max": 2.1995664872358427,
    "reward_min": 1.4740510514218625,
    "reward_std": 0.14361598094222383,
    "timesteps": 319083309,
    "learntime": 0.1996068360749632,
    "sampletime": 8.782301770988852,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 908,
    "reward_mean": 0.1175346512578049,
    "reward_max": 2.1577123437274373,
    "reward_min": -16.82008701049243,
    "reward_std": 3.934855737513783,
    "timesteps": 319438995,
    "learntime": 0.23877329984679818,
    "sampletime": 8.682255349121988,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 909,
    "reward_mean": 1.1310858596988496,
    "reward_max": 2.422293585773633,
    "reward_min": -7.42556560804334,
    "reward_std": 2.7151277567553262,
    "timesteps": 319797054,
    "learntime": 0.20681632705964148,
    "sampletime": 8.702038987074047,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 910,
    "reward_mean": 0.64459238177705,
    "reward_max": 2.2243873908753584,
    "reward_min": -25.362886816065647,
    "reward_std": 4.159351274903119,
    "timesteps": 320154123,
    "learntime": 0.2556104629766196,
    "sampletime": 8.787608101963997,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 911,
    "reward_mean": 1.9505512289057891,
    "reward_max": 2.351912458546307,
    "reward_min": 1.6997304065940104,
    "reward_std": 0.141019842736662,
    "timesteps": 320514843,
    "learntime": 0.2048839379567653,
    "sampletime": 8.775660558836535,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 912,
    "reward_mean": 1.5772551426019876,
    "reward_max": 2.282010170348886,
    "reward_min": -6.947116827682214,
    "reward_std": 1.838333778969378,
    "timesteps": 320874501,
    "learntime": 0.2059328791219741,
    "sampletime": 8.78158322093077,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 913,
    "reward_mean": 2.024884952341532,
    "reward_max": 2.4394030203552415,
    "reward_min": 1.7932516424281666,
    "reward_std": 0.12662549103732287,
    "timesteps": 321235221,
    "learntime": 0.193068205146119,
    "sampletime": 8.817892214981839,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 914,
    "reward_mean": 1.6008470518326288,
    "reward_max": 2.4776597512871796,
    "reward_min": -7.312587509563226,
    "reward_std": 1.9536801579381264,
    "timesteps": 321594615,
    "learntime": 0.19663792103528976,
    "sampletime": 8.704957344802096,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 915,
    "reward_mean": 1.5782389965570978,
    "reward_max": 2.3375191012235117,
    "reward_min": -6.967821647383091,
    "reward_std": 1.8602618089372929,
    "timesteps": 321954165,
    "learntime": 0.2091299940366298,
    "sampletime": 8.821318764938042,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 916,
    "reward_mean": 1.986790209769965,
    "reward_max": 2.248539067820685,
    "reward_min": 1.754539182490781,
    "reward_std": 0.10407720846158905,
    "timesteps": 322314885,
    "learntime": 0.2027531669009477,
    "sampletime": 8.67066174489446,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 917,
    "reward_mean": 2.018658341234973,
    "reward_max": 2.515531743475353,
    "reward_min": 1.6775388396309774,
    "reward_std": 0.17843611564718811,
    "timesteps": 322675605,
    "learntime": 0.1988311700988561,
    "sampletime": 8.8076740228571,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 918,
    "reward_mean": 1.9628089949694678,
    "reward_max": 2.3438891331527625,
    "reward_min": 1.5779768539424452,
    "reward_std": 0.15679342947549435,
    "timesteps": 323036325,
    "learntime": 0.19815275608561933,
    "sampletime": 8.750759923132136,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 919,
    "reward_mean": 1.5910505524237848,
    "reward_max": 2.3798585048465997,
    "reward_min": -6.9285637952826535,
    "reward_std": 1.771792877415144,
    "timesteps": 323395863,
    "learntime": 0.20236624008975923,
    "sampletime": 8.721121311187744,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 920,
    "reward_mean": 1.9894247923112132,
    "reward_max": 2.296210965804425,
    "reward_min": 1.6553994025796912,
    "reward_std": 0.13075013104720853,
    "timesteps": 323756583,
    "learntime": 0.19845243101008236,
    "sampletime": 8.865196452941746,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 921,
    "reward_mean": 1.9790452246230033,
    "reward_max": 2.2944813096740564,
    "reward_min": 1.7190764889934185,
    "reward_std": 0.11163915164623055,
    "timesteps": 324117303,
    "learntime": 0.20053982199169695,
    "sampletime": 8.729039064841345,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 922,
    "reward_mean": 2.037909726754277,
    "reward_max": 2.3387314781747643,
    "reward_min": 1.6213703611154184,
    "reward_std": 0.13322580950416812,
    "timesteps": 324478023,
    "learntime": 0.19643338792957366,
    "sampletime": 8.748309215065092,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 923,
    "reward_mean": 2.0079925738373525,
    "reward_max": 2.3305904760455785,
    "reward_min": 1.5897392531844516,
    "reward_std": 0.14605612797077538,
    "timesteps": 324838743,
    "learntime": 0.20179843506775796,
    "sampletime": 8.713168278802186,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 924,
    "reward_mean": 1.988470646265514,
    "reward_max": 2.277919569621159,
    "reward_min": 1.641324087253855,
    "reward_std": 0.1428959972658094,
    "timesteps": 325199463,
    "learntime": 0.2011708749923855,
    "sampletime": 8.759256670018658,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 925,
    "reward_mean": 1.9461328579292738,
    "reward_max": 2.181039463954439,
    "reward_min": 1.7219470524781173,
    "reward_std": 0.12314249424996096,
    "timesteps": 325560183,
    "learntime": 0.19521705387160182,
    "sampletime": 8.756425981177017,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 926,
    "reward_mean": 1.5685182496988936,
    "reward_max": 2.212847539755534,
    "reward_min": -6.687215867521997,
    "reward_std": 1.7747033776011711,
    "timesteps": 325919730,
    "learntime": 0.20307255699299276,
    "sampletime": 8.695503799943253,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 927,
    "reward_mean": 1.9901606215691863,
    "reward_max": 2.222145019581973,
    "reward_min": 1.662865197711099,
    "reward_std": 0.13538457154527184,
    "timesteps": 326280450,
    "learntime": 0.21950743696652353,
    "sampletime": 8.868837135843933,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 928,
    "reward_mean": 2.0036273539674743,
    "reward_max": 2.2890087677609907,
    "reward_min": 1.6339615462334613,
    "reward_std": 0.15332101566591352,
    "timesteps": 326641170,
    "learntime": 0.20824407087638974,
    "sampletime": 8.80603105807677,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 929,
    "reward_mean": 1.9847013593762015,
    "reward_max": 2.2211340597455567,
    "reward_min": 1.7147502720595844,
    "reward_std": 0.11312628499417207,
    "timesteps": 327001890,
    "learntime": 0.19383581005968153,
    "sampletime": 8.79082441306673,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 930,
    "reward_mean": 1.9913568717313692,
    "reward_max": 2.333845837006162,
    "reward_min": 1.6394861769028148,
    "reward_std": 0.13154387372404885,
    "timesteps": 327362610,
    "learntime": 0.19686619192361832,
    "sampletime": 8.734811911126599,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 931,
    "reward_mean": 1.8892412635377405,
    "reward_max": 2.1715567920896706,
    "reward_min": 1.5633839559902993,
    "reward_std": 0.134003678341809,
    "timesteps": 327723330,
    "learntime": 0.1970410409849137,
    "sampletime": 8.801707704085857,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 932,
    "reward_mean": 1.9715837546563217,
    "reward_max": 2.3835490131662485,
    "reward_min": 1.5802867794920894,
    "reward_std": 0.1670336476234922,
    "timesteps": 328084050,
    "learntime": 0.20334605290554464,
    "sampletime": 8.795451489975676,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 933,
    "reward_mean": 1.9196771591264765,
    "reward_max": 2.2794922597980363,
    "reward_min": 1.643819470748754,
    "reward_std": 0.12484688335177059,
    "timesteps": 328444770,
    "learntime": 0.19975715200416744,
    "sampletime": 8.868883548071608,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 934,
    "reward_mean": 1.9828537070078012,
    "reward_max": 2.4941554930725633,
    "reward_min": 1.5327499322152205,
    "reward_std": 0.172873716412773,
    "timesteps": 328805490,
    "learntime": 0.22546945489011705,
    "sampletime": 8.80876399599947,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 935,
    "reward_mean": 1.5465501656633598,
    "reward_max": 2.2908226255517383,
    "reward_min": -8.041191771686446,
    "reward_std": 1.9927559117930034,
    "timesteps": 329164851,
    "learntime": 0.1962414390873164,
    "sampletime": 8.760118351085111,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 936,
    "reward_mean": 1.9923708280431978,
    "reward_max": 2.376214143308582,
    "reward_min": 1.6416084975794407,
    "reward_std": 0.1387512041067656,
    "timesteps": 329525571,
    "learntime": 0.19185626204125583,
    "sampletime": 8.703760046046227,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 937,
    "reward_mean": 1.9620739046658342,
    "reward_max": 2.231287519052985,
    "reward_min": 1.6200943371725496,
    "reward_std": 0.13401354998709064,
    "timesteps": 329886291,
    "learntime": 0.2129835980013013,
    "sampletime": 8.754609117982909,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 938,
    "reward_mean": 1.9779234690031504,
    "reward_max": 2.3240484799612022,
    "reward_min": 1.5957576725279161,
    "reward_std": 0.13522035693124368,
    "timesteps": 330247011,
    "learntime": 0.2026228830218315,
    "sampletime": 8.974338961066678,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 939,
    "reward_mean": 2.0188424576488697,
    "reward_max": 2.3652269430211557,
    "reward_min": 1.6222657577653221,
    "reward_std": 0.12892341482743105,
    "timesteps": 330607731,
    "learntime": 0.20302493777126074,
    "sampletime": 8.78639759705402,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 940,
    "reward_mean": 1.995154664904311,
    "reward_max": 2.2174293193278958,
    "reward_min": 1.6528303432243048,
    "reward_std": 0.13632525119838276,
    "timesteps": 330968451,
    "learntime": 0.19913252792321146,
    "sampletime": 8.822585019050166,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 941,
    "reward_mean": 1.9896082243383533,
    "reward_max": 2.228838109488907,
    "reward_min": 1.6616489591791472,
    "reward_std": 0.12346900762349271,
    "timesteps": 331329171,
    "learntime": 0.2108119330368936,
    "sampletime": 8.744033287046477,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 942,
    "reward_mean": 2.0084857138792658,
    "reward_max": 2.3792790775187287,
    "reward_min": 1.7133832229301305,
    "reward_std": 0.1357014472226384,
    "timesteps": 331689891,
    "learntime": 0.1994642938952893,
    "sampletime": 8.78347520204261,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 943,
    "reward_mean": 1.9950088059332596,
    "reward_max": 2.3619794975736896,
    "reward_min": 1.6763961349409326,
    "reward_std": 0.15226905934413668,
    "timesteps": 332050611,
    "learntime": 0.18922208901494741,
    "sampletime": 8.746878230012953,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 944,
    "reward_mean": 2.0626108539604138,
    "reward_max": 2.374027192571452,
    "reward_min": 1.5963723210496163,
    "reward_std": 0.12960981907290997,
    "timesteps": 332411331,
    "learntime": 0.19994967384263873,
    "sampletime": 8.783688575029373,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 945,
    "reward_mean": 2.0165286646936043,
    "reward_max": 2.4123871627433027,
    "reward_min": 1.7012952144017819,
    "reward_std": 0.13890309633277861,
    "timesteps": 332772051,
    "learntime": 0.20000459905713797,
    "sampletime": 8.759043979924172,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 946,
    "reward_mean": 2.038630036528767,
    "reward_max": 2.3236621988824364,
    "reward_min": 1.5709779976565494,
    "reward_std": 0.12563676179900704,
    "timesteps": 333132771,
    "learntime": 0.196381556103006,
    "sampletime": 8.955161439953372,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 947,
    "reward_mean": 1.9971177228574823,
    "reward_max": 2.2937944963059347,
    "reward_min": 1.5621371760216471,
    "reward_std": 0.1460052448869989,
    "timesteps": 333493491,
    "learntime": 0.20243928278796375,
    "sampletime": 8.742443181108683,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 948,
    "reward_mean": 2.0333405218810596,
    "reward_max": 2.440215555030257,
    "reward_min": 1.7838726877411248,
    "reward_std": 0.13851125494427652,
    "timesteps": 333854211,
    "learntime": 0.20601143315434456,
    "sampletime": 8.887935251928866,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 949,
    "reward_mean": 2.1067309288949843,
    "reward_max": 2.3901355440065126,
    "reward_min": 1.6215671880856823,
    "reward_std": 0.14558196820037053,
    "timesteps": 334214931,
    "learntime": 0.25281064584851265,
    "sampletime": 8.792037789011374,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 950,
    "reward_mean": 1.9957705745704333,
    "reward_max": 2.3953897324108473,
    "reward_min": 1.778172024116483,
    "reward_std": 0.11905145545863127,
    "timesteps": 334575651,
    "learntime": 0.19970221491530538,
    "sampletime": 8.760310932062566,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 951,
    "reward_mean": 2.0448437996133926,
    "reward_max": 2.2822330567851723,
    "reward_min": 1.813269284262785,
    "reward_std": 0.12595045182927822,
    "timesteps": 334936371,
    "learntime": 0.20262447302229702,
    "sampletime": 8.695213709026575,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 952,
    "reward_mean": 2.0668231992114574,
    "reward_max": 2.4950151755968384,
    "reward_min": 1.7871402792754267,
    "reward_std": 0.13419370973009645,
    "timesteps": 335297091,
    "learntime": 0.20200574304908514,
    "sampletime": 8.860155769856647,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 953,
    "reward_mean": 2.067277340961052,
    "reward_max": 2.415330833684876,
    "reward_min": 1.8500947224877577,
    "reward_std": 0.1146186219334248,
    "timesteps": 335657811,
    "learntime": 0.2028379561379552,
    "sampletime": 8.784254148136824,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 954,
    "reward_mean": 2.043061486483447,
    "reward_max": 2.371373719444044,
    "reward_min": 1.7775155035196795,
    "reward_std": 0.134130242662189,
    "timesteps": 336018531,
    "learntime": 0.20615633903071284,
    "sampletime": 8.706690221093595,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 955,
    "reward_mean": 2.050363006207376,
    "reward_max": 2.37344357548246,
    "reward_min": 1.8124697844914095,
    "reward_std": 0.10282945779840127,
    "timesteps": 336379251,
    "learntime": 0.20000695902854204,
    "sampletime": 8.84271776699461,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 956,
    "reward_mean": 2.036481311544003,
    "reward_max": 2.269638788004431,
    "reward_min": 1.7278140992099027,
    "reward_std": 0.10998657450593648,
    "timesteps": 336739971,
    "learntime": 0.2118262890726328,
    "sampletime": 8.891679035965353,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 957,
    "reward_mean": 2.0402857571172075,
    "reward_max": 2.428110061915393,
    "reward_min": 1.623674421313667,
    "reward_std": 0.17148520247734228,
    "timesteps": 337100691,
    "learntime": 0.20614941813983023,
    "sampletime": 8.80225911992602,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 958,
    "reward_mean": 2.0121331243252993,
    "reward_max": 2.2265782781482395,
    "reward_min": 1.7147443634158746,
    "reward_std": 0.10569031607170803,
    "timesteps": 337461411,
    "learntime": 0.20512516400776803,
    "sampletime": 8.671578533947468,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 959,
    "reward_mean": 2.0018098679187695,
    "reward_max": 2.3258247434083956,
    "reward_min": 1.7741231458472357,
    "reward_std": 0.11509055857083243,
    "timesteps": 337822131,
    "learntime": 0.20480740815401077,
    "sampletime": 8.794009564211592,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 960,
    "reward_mean": 2.0183192802002026,
    "reward_max": 2.56124448671471,
    "reward_min": 1.6841434337547965,
    "reward_std": 0.1570147541150763,
    "timesteps": 338182851,
    "learntime": 0.19825225695967674,
    "sampletime": 8.795984657015651,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 961,
    "reward_mean": 2.070941188531805,
    "reward_max": 2.4451134699063677,
    "reward_min": 1.8035720478117978,
    "reward_std": 0.1369739753987854,
    "timesteps": 338543571,
    "learntime": 0.20254510105587542,
    "sampletime": 8.858674306888133,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 962,
    "reward_mean": 0.7756082895352225,
    "reward_max": 2.3531764836868985,
    "reward_min": -14.921064866310594,
    "reward_std": 3.404060001330503,
    "timesteps": 338900286,
    "learntime": 0.20197573117911816,
    "sampletime": 8.63609266700223,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 963,
    "reward_mean": 1.967920462843845,
    "reward_max": 2.307458258880421,
    "reward_min": 1.593531846033519,
    "reward_std": 0.1389454113463928,
    "timesteps": 339261006,
    "learntime": 0.20212716585956514,
    "sampletime": 8.989632052835077,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 964,
    "reward_mean": 2.0383743033126365,
    "reward_max": 2.3107506407311886,
    "reward_min": 1.7756798632670474,
    "reward_std": 0.11377524910974551,
    "timesteps": 339621726,
    "learntime": 0.2021752679720521,
    "sampletime": 8.762229589978233,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 965,
    "reward_mean": 2.008230099689332,
    "reward_max": 2.482559964422963,
    "reward_min": 1.7756785894546019,
    "reward_std": 0.13453549074421148,
    "timesteps": 339982446,
    "learntime": 0.20667984685860574,
    "sampletime": 8.800811610883102,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 966,
    "reward_mean": 0.7755027494900333,
    "reward_max": 2.45222417514235,
    "reward_min": -23.394125924704394,
    "reward_std": 3.9809449622718254,
    "timesteps": 340339149,
    "learntime": 0.20224164193496108,
    "sampletime": 8.742726942058653,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 967,
    "reward_mean": 2.0091464197966733,
    "reward_max": 2.280471598121835,
    "reward_min": 1.7370233467822371,
    "reward_std": 0.11097077265913274,
    "timesteps": 340699869,
    "learntime": 0.20482786116190255,
    "sampletime": 8.83139933901839,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 968,
    "reward_mean": 0.025532419974485743,
    "reward_max": 2.4749054441993135,
    "reward_min": -48.56665675437156,
    "reward_std": 7.059927386206668,
    "timesteps": 341053947,
    "learntime": 0.20115114492364228,
    "sampletime": 8.651957836002111,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 969,
    "reward_mean": -0.06474283916289925,
    "reward_max": 2.407849629037727,
    "reward_min": -25.70871177985629,
    "reward_std": 5.086232614007527,
    "timesteps": 341408025,
    "learntime": 0.21700610406696796,
    "sampletime": 8.566771283978596,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 970,
    "reward_mean": 2.037130350335959,
    "reward_max": 2.298530539556142,
    "reward_min": 1.6187261039297212,
    "reward_std": 0.1321286332306511,
    "timesteps": 341768745,
    "learntime": 0.1942544139456004,
    "sampletime": 8.983158940915018,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 971,
    "reward_mean": -0.4869551933900923,
    "reward_max": 2.2948474192385064,
    "reward_min": -34.653691877689475,
    "reward_std": 6.093628807006116,
    "timesteps": 342121758,
    "learntime": 0.20800299500115216,
    "sampletime": 8.68770709587261,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 972,
    "reward_mean": 1.9891446913980573,
    "reward_max": 2.4370883073782093,
    "reward_min": 1.6483893601795274,
    "reward_std": 0.15418712721858355,
    "timesteps": 342482478,
    "learntime": 0.20537861692719162,
    "sampletime": 8.696809658082202,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 973,
    "reward_mean": 1.515174220319939,
    "reward_max": 2.2043726150736647,
    "reward_min": -7.544031322686794,
    "reward_std": 1.9706988923701019,
    "timesteps": 342841866,
    "learntime": 0.21216275892220438,
    "sampletime": 8.69295062799938,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 974,
    "reward_mean": 2.018874720752273,
    "reward_max": 2.3745882854528797,
    "reward_min": 1.5371209103984484,
    "reward_std": 0.1847771354413393,
    "timesteps": 343202586,
    "learntime": 0.20138463703915477,
    "sampletime": 8.803363936953247,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 975,
    "reward_mean": 2.050478381576055,
    "reward_max": 2.37728013267747,
    "reward_min": 1.8163877623508453,
    "reward_std": 0.1273262698586842,
    "timesteps": 343563306,
    "learntime": 0.2043806640431285,
    "sampletime": 8.812616732902825,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 976,
    "reward_mean": 1.6493230194638153,
    "reward_max": 2.5705060435910547,
    "reward_min": -7.335942272280318,
    "reward_std": 1.9405712802754498,
    "timesteps": 343922697,
    "learntime": 0.19557322305627167,
    "sampletime": 8.731211388949305,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 977,
    "reward_mean": 2.0401918993125916,
    "reward_max": 2.3543599326812608,
    "reward_min": 1.7500549141194706,
    "reward_std": 0.12048883717712092,
    "timesteps": 344283417,
    "learntime": 0.20567355398088694,
    "sampletime": 9.026431489968672,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 978,
    "reward_mean": 0.355239651138657,
    "reward_max": 2.6956026499498273,
    "reward_min": -31.930194234422142,
    "reward_std": 5.054353878413024,
    "timesteps": 344638818,
    "learntime": 0.20847308286465704,
    "sampletime": 8.695777022046968,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 979,
    "reward_mean": 1.6315889245963813,
    "reward_max": 2.4899843045030545,
    "reward_min": -6.796942216083125,
    "reward_std": 1.8223879641358165,
    "timesteps": 344998350,
    "learntime": 0.20743262791074812,
    "sampletime": 8.803144169040024,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 980,
    "reward_mean": 2.0731866687982574,
    "reward_max": 2.5546710248325097,
    "reward_min": 1.6219151247102557,
    "reward_std": 0.1764038768921995,
    "timesteps": 345359070,
    "learntime": 0.2067122650332749,
    "sampletime": 8.73181480797939,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 981,
    "reward_mean": 2.1000777883152795,
    "reward_max": 2.6728436180415085,
    "reward_min": 1.5810760000269044,
    "reward_std": 0.19319982589449997,
    "timesteps": 345719790,
    "learntime": 0.20450729504227638,
    "sampletime": 8.728781888028607,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 982,
    "reward_mean": 1.9827050224086862,
    "reward_max": 2.3730910752377805,
    "reward_min": 1.6081922223339908,
    "reward_std": 0.1537302335755485,
    "timesteps": 346080510,
    "learntime": 0.20570024498738348,
    "sampletime": 8.774610715918243,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 983,
    "reward_mean": 2.073521373468882,
    "reward_max": 2.3789202620550456,
    "reward_min": 1.7333608702421308,
    "reward_std": 0.16365854139568947,
    "timesteps": 346441230,
    "learntime": 0.20533461892046034,
    "sampletime": 8.860790529986843,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 984,
    "reward_mean": 1.370767082182955,
    "reward_max": 2.6974022518123864,
    "reward_min": -6.765358581961749,
    "reward_std": 2.5613363016606026,
    "timesteps": 346799703,
    "learntime": 0.20243249903433025,
    "sampletime": 8.675066126976162,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 985,
    "reward_mean": 1.7010666763350468,
    "reward_max": 2.6968377327106645,
    "reward_min": -6.972954729757148,
    "reward_std": 1.8223892823399208,
    "timesteps": 347159649,
    "learntime": 0.20688926917500794,
    "sampletime": 8.773329675896093,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 986,
    "reward_mean": 0.21908888634454277,
    "reward_max": 3.0247728231382394,
    "reward_min": -43.293180519441556,
    "reward_std": 6.503788240962341,
    "timesteps": 347513823,
    "learntime": 0.1945127840153873,
    "sampletime": 8.861240701982751,
    "best_max_mean": 0.21908888634454277,
    "best_max": 3.0247728231382394
  },
  {
    "gen": 987,
    "reward_mean": 2.221008461714275,
    "reward_max": 2.7665517764875047,
    "reward_min": 1.8077450058542888,
    "reward_std": 0.23423394069410705,
    "timesteps": 347874543,
    "learntime": 0.2506897838320583,
    "sampletime": 8.970462661003694,
    "best_max_mean": 0.21908888634454277,
    "best_max": 3.0247728231382394
  },
  {
    "gen": 988,
    "reward_mean": 1.761744857456289,
    "reward_max": 3.0462437489662637,
    "reward_min": -7.519939049644041,
    "reward_std": 1.9330622220985694,
    "timesteps": 348234621,
    "learntime": 0.21274659200571477,
    "sampletime": 8.780794029124081,
    "best_max_mean": 1.761744857456289,
    "best_max": 3.0462437489662637
  },
  {
    "gen": 989,
    "reward_mean": 2.2967302355793926,
    "reward_max": 2.779941788878093,
    "reward_min": 1.7830589912999912,
    "reward_std": 0.22832840648933783,
    "timesteps": 348595341,
    "learntime": 0.20460441010072827,
    "sampletime": 8.814936725888401,
    "best_max_mean": 1.761744857456289,
    "best_max": 3.0462437489662637
  },
  {
    "gen": 990,
    "reward_mean": 2.2407494287564713,
    "reward_max": 2.8782800980972927,
    "reward_min": 1.8528144366173345,
    "reward_std": 0.23630007699592487,
    "timesteps": 348956061,
    "learntime": 0.19505771016702056,
    "sampletime": 8.748663628008217,
    "best_max_mean": 1.761744857456289,
    "best_max": 3.0462437489662637
  },
  {
    "gen": 991,
    "reward_mean": 2.3979669700965105,
    "reward_max": 3.354699164844172,
    "reward_min": 1.8048902262946458,
    "reward_std": 0.3527277997379734,
    "timesteps": 349316781,
    "learntime": 0.1973267630673945,
    "sampletime": 8.84762457688339,
    "best_max_mean": 2.3979669700965105,
    "best_max": 3.354699164844172
  },
  {
    "gen": 992,
    "reward_mean": 2.5810795025413036,
    "reward_max": 3.6058097556762516,
    "reward_min": 1.8261816850157815,
    "reward_std": 0.40038551050427723,
    "timesteps": 349677501,
    "learntime": 0.21922439918853343,
    "sampletime": 8.832573443185538,
    "best_max_mean": 2.5810795025413036,
    "best_max": 3.6058097556762516
  },
  {
    "gen": 993,
    "reward_mean": 2.029353227860674,
    "reward_max": 3.338584580613919,
    "reward_min": -6.755547066049821,
    "reward_std": 1.9357577390798926,
    "timesteps": 350036880,
    "learntime": 0.22357625304721296,
    "sampletime": 8.829742077039555,
    "best_max_mean": 2.5810795025413036,
    "best_max": 3.6058097556762516
  },
  {
    "gen": 994,
    "reward_mean": 2.704639808718173,
    "reward_max": 3.3669189532449693,
    "reward_min": 2.0407560579231774,
    "reward_std": 0.33436780894939283,
    "timesteps": 350397600,
    "learntime": 0.24922235100530088,
    "sampletime": 8.799453761894256,
    "best_max_mean": 2.5810795025413036,
    "best_max": 3.6058097556762516
  },
  {
    "gen": 995,
    "reward_mean": 1.5895394345748506,
    "reward_max": 3.737301921773572,
    "reward_min": -6.831432988909499,
    "reward_std": 3.156505817096844,
    "timesteps": 350755389,
    "learntime": 0.21291276603005826,
    "sampletime": 8.709128601010889,
    "best_max_mean": 1.5895394345748506,
    "best_max": 3.737301921773572
  },
  {
    "gen": 996,
    "reward_mean": 2.431205130532,
    "reward_max": 4.297030082131666,
    "reward_min": -6.645982099247211,
    "reward_std": 2.0199415180927685,
    "timesteps": 351115464,
    "learntime": 0.2546015039552003,
    "sampletime": 8.942358396947384,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 997,
    "reward_mean": 2.30108739223557,
    "reward_max": 3.9422323696247354,
    "reward_min": -7.228842272652513,
    "reward_std": 2.6995081465438604,
    "timesteps": 351474636,
    "learntime": 0.21918567805550992,
    "sampletime": 8.771539381006733,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 998,
    "reward_mean": 3.138821190030484,
    "reward_max": 4.037876951349474,
    "reward_min": 2.5356073878620804,
    "reward_std": 0.34550179504695805,
    "timesteps": 351835356,
    "learntime": 0.2638202589005232,
    "sampletime": 8.862011606106535,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 999,
    "reward_mean": 2.019739532884566,
    "reward_max": 4.004165569397928,
    "reward_min": -15.560689621181654,
    "reward_std": 3.6415538205825357,
    "timesteps": 352193622,
    "learntime": 0.2009182299952954,
    "sampletime": 8.729837493039668,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 1000,
    "reward_mean": -0.38326145188591765,
    "reward_max": 4.942607709126383,
    "reward_min": -42.911911682239875,
    "reward_std": 7.432384335666449,
    "timesteps": 352545072,
    "learntime": 0.24202015507034957,
    "sampletime": 8.583843489876017,
    "best_max_mean": -0.38326145188591765,
    "best_max": 4.942607709126383
  },
  {
    "gen": 1001,
    "reward_mean": 1.926951679972822,
    "reward_max": 4.9839519419615605,
    "reward_min": -13.117347136510949,
    "reward_std": 3.8340876607203374,
    "timesteps": 352902195,
    "learntime": 0.11182131990790367,
    "sampletime": 8.70217459090054,
    "best_max_mean": 1.926951679972822,
    "best_max": 4.9839519419615605
  },
  {
    "gen": 1002,
    "reward_mean": 2.2845884951309787,
    "reward_max": 5.275274546818706,
    "reward_min": -6.077934265401302,
    "reward_std": 3.5447729116590057,
    "timesteps": 353260098,
    "learntime": 0.26539470814168453,
    "sampletime": 8.743376115104184,
    "best_max_mean": 2.2845884951309787,
    "best_max": 5.275274546818706
  },
  {
    "gen": 1003,
    "reward_mean": 2.3901714223744257,
    "reward_max": 5.019482718858246,
    "reward_min": -15.091897645107984,
    "reward_std": 4.190453048422489,
    "timesteps": 353618358,
    "learntime": 0.2514700060710311,
    "sampletime": 8.76513236691244,
    "best_max_mean": 2.2845884951309787,
    "best_max": 5.275274546818706
  },
  {
    "gen": 1004,
    "reward_mean": 0.21460248051423103,
    "reward_max": 6.066502835841453,
    "reward_min": -43.20852722363745,
    "reward_std": 7.320688206969386,
    "timesteps": 353969952,
    "learntime": 0.20841591316275299,
    "sampletime": 8.74903783807531,
    "best_max_mean": 0.21460248051423103,
    "best_max": 6.066502835841453
  },
  {
    "gen": 1005,
    "reward_mean": 1.4715375733918123,
    "reward_max": 5.184157814694721,
    "reward_min": -13.855902163779264,
    "reward_std": 4.44667635047519,
    "timesteps": 354324753,
    "learntime": 0.2823342839255929,
    "sampletime": 8.77175336307846,
    "best_max_mean": 0.21460248051423103,
    "best_max": 6.066502835841453
  },
  {
    "gen": 1006,
    "reward_mean": -0.2380303207686824,
    "reward_max": 5.431120441769683,
    "reward_min": -13.632482639429243,
    "reward_std": 5.564674812152565,
    "timesteps": 354679155,
    "learntime": 0.2082646198105067,
    "sampletime": 8.698541725985706,
    "best_max_mean": 0.21460248051423103,
    "best_max": 6.066502835841453
  },
  {
    "gen": 1007,
    "reward_mean": 0.7340963177198528,
    "reward_max": 5.918060875716477,
    "reward_min": -24.257492124106545,
    "reward_std": 5.6450087211588675,
    "timesteps": 355031517,
    "learntime": 0.24178620893508196,
    "sampletime": 8.642178006004542,
    "best_max_mean": 0.21460248051423103,
    "best_max": 6.066502835841453
  },
  {
    "gen": 1008,
    "reward_mean": -0.8147091826303456,
    "reward_max": 5.386361034036695,
    "reward_min": -24.00720260081333,
    "reward_std": 7.303707213037104,
    "timesteps": 355382271,
    "learntime": 0.20726541290059686,
    "sampletime": 8.600865343119949,
    "best_max_mean": 0.21460248051423103,
    "best_max": 6.066502835841453
  },
  {
    "gen": 1009,
    "reward_mean": -0.9267723086079837,
    "reward_max": 6.837641460701087,
    "reward_min": -22.628820087443195,
    "reward_std": 7.106361013194756,
    "timesteps": 355732488,
    "learntime": 0.2645624370779842,
    "sampletime": 8.630387429147959,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1010,
    "reward_mean": -2.2414125104183746,
    "reward_max": 6.117647428749914,
    "reward_min": -32.31566099356507,
    "reward_std": 8.841586196765236,
    "timesteps": 356079927,
    "learntime": 0.217455442994833,
    "sampletime": 8.64747611200437,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1011,
    "reward_mean": -5.195053268267271,
    "reward_max": 6.474226015725761,
    "reward_min": -49.29696696370868,
    "reward_std": 12.403000520221807,
    "timesteps": 356419980,
    "learntime": 0.26463609701022506,
    "sampletime": 8.44918665708974,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1012,
    "reward_mean": -7.088584989037912,
    "reward_max": 6.738643723131845,
    "reward_min": -45.11797021295124,
    "reward_std": 10.334546763678619,
    "timesteps": 356755515,
    "learntime": 0.20898993290029466,
    "sampletime": 8.487715349067003,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1013,
    "reward_mean": -8.769019123839103,
    "reward_max": 5.850720861950483,
    "reward_min": -41.964722006680496,
    "reward_std": 11.065798404086442,
    "timesteps": 357088812,
    "learntime": 0.23683224595151842,
    "sampletime": 8.522506191162392,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1014,
    "reward_mean": -1.6698604938632746,
    "reward_max": 6.167895697529963,
    "reward_min": -30.71116538462935,
    "reward_std": 7.696379696283118,
    "timesteps": 357436101,
    "learntime": 0.2751048789359629,
    "sampletime": 8.542114447802305,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1015,
    "reward_mean": -4.621323181658537,
    "reward_max": 5.509890899690311,
    "reward_min": -23.599714632117845,
    "reward_std": 8.561114734075705,
    "timesteps": 357781953,
    "learntime": 0.2069725061301142,
    "sampletime": 8.531666370108724,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1016,
    "reward_mean": -7.783931494552329,
    "reward_max": 6.073918677630096,
    "reward_min": -40.701413310055315,
    "reward_std": 12.353745549146364,
    "timesteps": 358116561,
    "learntime": 0.21239732299000025,
    "sampletime": 8.351802451070398,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1017,
    "reward_mean": -4.0758274345198,
    "reward_max": 6.17180767480992,
    "reward_min": -33.07819209983714,
    "reward_std": 9.261159981894425,
    "timesteps": 358456461,
    "learntime": 0.2541068329010159,
    "sampletime": 8.491845335112885,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1018,
    "reward_mean": -2.213648865130928,
    "reward_max": 6.556140648349273,
    "reward_min": -23.750293130205,
    "reward_std": 8.24763745911315,
    "timesteps": 358802316,
    "learntime": 0.19868211494758725,
    "sampletime": 8.61025563091971,
    "best_max_mean": -0.9267723086079837,
    "best_max": 6.837641460701087
  },
  {
    "gen": 1019,
    "reward_mean": -0.1261346636593036,
    "reward_max": 7.682765036567367,
    "reward_min": -21.775204744261412,
    "reward_std": 7.131199806232093,
    "timesteps": 359153295,
    "learntime": 0.25438480405136943,
    "sampletime": 8.617145208176225,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1020,
    "reward_mean": 0.6411029657498475,
    "reward_max": 6.266791829598978,
    "reward_min": -14.45445039307798,
    "reward_std": 5.750722644845293,
    "timesteps": 359505411,
    "learntime": 0.210805183975026,
    "sampletime": 8.83683466608636,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1021,
    "reward_mean": -2.5894937034111196,
    "reward_max": 6.123849506285324,
    "reward_min": -45.59795909517562,
    "reward_std": 8.774652353950342,
    "timesteps": 359855331,
    "learntime": 0.2683392148464918,
    "sampletime": 8.748562610941008,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1022,
    "reward_mean": -1.8935126030790188,
    "reward_max": 5.953434712648618,
    "reward_min": -31.806210807334125,
    "reward_std": 8.011036637068475,
    "timesteps": 360202062,
    "learntime": 0.21483769896440208,
    "sampletime": 8.597557640867308,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1023,
    "reward_mean": -3.218811970378994,
    "reward_max": 5.72662383797367,
    "reward_min": -40.718406142183646,
    "reward_std": 7.815263429557664,
    "timesteps": 360547266,
    "learntime": 0.2380446051247418,
    "sampletime": 8.591347453882918,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1024,
    "reward_mean": 2.531522012503568,
    "reward_max": 6.116183106484114,
    "reward_min": -23.207415564578366,
    "reward_std": 5.040229774404246,
    "timesteps": 360903072,
    "learntime": 0.20541436900384724,
    "sampletime": 8.714333884883672,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1025,
    "reward_mean": 2.767999242730991,
    "reward_max": 6.002652465619821,
    "reward_min": -21.210582165997852,
    "reward_std": 4.674003309617286,
    "timesteps": 361260249,
    "learntime": 0.25181192392483354,
    "sampletime": 8.728377467952669,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1026,
    "reward_mean": 1.0618225356401694,
    "reward_max": 6.138208988997519,
    "reward_min": -15.316110962372813,
    "reward_std": 5.84429862643053,
    "timesteps": 361614420,
    "learntime": 0.20568990684114397,
    "sampletime": 8.7786667291075,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1027,
    "reward_mean": 2.253531367941019,
    "reward_max": 5.732921864105786,
    "reward_min": -14.574496621347146,
    "reward_std": 4.795959070882314,
    "timesteps": 361972626,
    "learntime": 0.23850952903740108,
    "sampletime": 8.777958394028246,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1028,
    "reward_mean": 0.5138599009621312,
    "reward_max": 5.991040434124771,
    "reward_min": -20.588570732857793,
    "reward_std": 6.480934398464707,
    "timesteps": 362326176,
    "learntime": 0.21908276295289397,
    "sampletime": 8.597323111956939,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1029,
    "reward_mean": 2.5883061594163457,
    "reward_max": 5.400739732512826,
    "reward_min": -6.654552756646427,
    "reward_std": 3.4411727953903917,
    "timesteps": 362684622,
    "learntime": 0.2542862109839916,
    "sampletime": 8.669359078165144,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1030,
    "reward_mean": 1.7457812982662082,
    "reward_max": 5.700668191687188,
    "reward_min": -14.669082400353744,
    "reward_std": 4.203585941477171,
    "timesteps": 363041631,
    "learntime": 0.21177848312072456,
    "sampletime": 8.653013532981277,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1031,
    "reward_mean": 3.608507894966725,
    "reward_max": 4.764629682660044,
    "reward_min": 2.3560080771761296,
    "reward_std": 0.5376012047872637,
    "timesteps": 363402351,
    "learntime": 0.2416329849511385,
    "sampletime": 8.724244605982676,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1032,
    "reward_mean": 3.4102821404471255,
    "reward_max": 5.881569791731128,
    "reward_min": -6.537190721264451,
    "reward_std": 2.168365120474419,
    "timesteps": 363762519,
    "learntime": 0.22672302182763815,
    "sampletime": 8.661043827887625,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1033,
    "reward_mean": 0.9408751132778028,
    "reward_max": 5.139662885137086,
    "reward_min": -15.737247401269007,
    "reward_std": 4.9046058905084875,
    "timesteps": 364117242,
    "learntime": 0.24502058885991573,
    "sampletime": 8.470463183009997,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1034,
    "reward_mean": 2.76718926295868,
    "reward_max": 4.218639492925086,
    "reward_min": -6.063358237802859,
    "reward_std": 1.9296191994874512,
    "timesteps": 364477206,
    "learntime": 0.2141558500006795,
    "sampletime": 8.624985032016411,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1035,
    "reward_mean": 2.3595057497974823,
    "reward_max": 4.937555483786935,
    "reward_min": -6.319404255249541,
    "reward_std": 2.612458661391213,
    "timesteps": 364835979,
    "learntime": 0.2429913878440857,
    "sampletime": 8.988322673132643,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1036,
    "reward_mean": 2.7106037457425676,
    "reward_max": 4.285771542836705,
    "reward_min": -6.436868514488169,
    "reward_std": 2.0110698167571393,
    "timesteps": 365195934,
    "learntime": 0.20943677611649036,
    "sampletime": 8.800003748154268,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1037,
    "reward_mean": 2.600208626526981,
    "reward_max": 4.482198661314957,
    "reward_min": -6.1233820028596035,
    "reward_std": 1.9203719631181118,
    "timesteps": 365555520,
    "learntime": 0.23725756886415184,
    "sampletime": 8.770498716039583,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1038,
    "reward_mean": 1.4205568459709599,
    "reward_max": 4.729299983394217,
    "reward_min": -20.57206463249572,
    "reward_std": 4.538275806516186,
    "timesteps": 365910756,
    "learntime": 0.2234329639468342,
    "sampletime": 8.733955625910312,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1039,
    "reward_mean": 2.1988987526451,
    "reward_max": 4.09690868805487,
    "reward_min": -6.72983738901729,
    "reward_std": 2.6037051039865244,
    "timesteps": 366269895,
    "learntime": 0.2350545630324632,
    "sampletime": 8.80125271808356,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1040,
    "reward_mean": 1.59896195078883,
    "reward_max": 3.7640790893258793,
    "reward_min": -6.743143304963739,
    "reward_std": 3.057050196980114,
    "timesteps": 366627618,
    "learntime": 0.20605951291508973,
    "sampletime": 8.715622965013608,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1041,
    "reward_mean": 2.8049827020924836,
    "reward_max": 3.762798771225127,
    "reward_min": 2.1073173388210815,
    "reward_std": 0.34496877487742833,
    "timesteps": 366988338,
    "learntime": 0.2608127109706402,
    "sampletime": 8.572460680035874,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1042,
    "reward_mean": 2.566668972883165,
    "reward_max": 4.062202511923026,
    "reward_min": -6.351942574838177,
    "reward_std": 1.953223008278326,
    "timesteps": 367347969,
    "learntime": 0.21302380412817,
    "sampletime": 8.672233018092811,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1043,
    "reward_mean": 1.5095189111589806,
    "reward_max": 4.071873022136665,
    "reward_min": -13.925083987303275,
    "reward_std": 3.4402510729854336,
    "timesteps": 367705605,
    "learntime": 0.2621699220035225,
    "sampletime": 8.569007805082947,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1044,
    "reward_mean": 3.0962284769109116,
    "reward_max": 4.788676390088352,
    "reward_min": 2.2454379823016493,
    "reward_std": 0.5114153191473849,
    "timesteps": 368066325,
    "learntime": 0.21369324112311006,
    "sampletime": 8.933210670016706,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1045,
    "reward_mean": 2.9294467887812603,
    "reward_max": 4.732413030151897,
    "reward_min": 2.128293959011152,
    "reward_std": 0.4767522691540933,
    "timesteps": 368427045,
    "learntime": 0.2482287068851292,
    "sampletime": 8.689529058989137,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1046,
    "reward_mean": 2.3137340310233814,
    "reward_max": 3.7379097819864486,
    "reward_min": -6.398549281637044,
    "reward_std": 1.8083521341972617,
    "timesteps": 368786631,
    "learntime": 0.2068306829314679,
    "sampletime": 8.685798395890743,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1047,
    "reward_mean": 2.3379154451524764,
    "reward_max": 3.8136306557571484,
    "reward_min": -5.921912753968641,
    "reward_std": 1.7555011461335088,
    "timesteps": 369146205,
    "learntime": 0.2553441319614649,
    "sampletime": 8.712745854863897,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1048,
    "reward_mean": 2.284536439816283,
    "reward_max": 3.608246758058101,
    "reward_min": -5.8585497990716275,
    "reward_std": 1.7901291481832018,
    "timesteps": 369505845,
    "learntime": 0.2141529149375856,
    "sampletime": 8.71553694200702,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1049,
    "reward_mean": 2.450796218809782,
    "reward_max": 3.9405114932627736,
    "reward_min": -6.1732678001351475,
    "reward_std": 1.9478255819260255,
    "timesteps": 369865464,
    "learntime": 0.21496059303171933,
    "sampletime": 8.832257733913139,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1050,
    "reward_mean": 2.9531932574448203,
    "reward_max": 4.147530670387133,
    "reward_min": 2.0058865145029885,
    "reward_std": 0.39670663635139525,
    "timesteps": 370226184,
    "learntime": 0.19890903495252132,
    "sampletime": 8.83954364201054,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1051,
    "reward_mean": 2.525489671319158,
    "reward_max": 4.445945206803805,
    "reward_min": -6.188020141848196,
    "reward_std": 1.8312578336573835,
    "timesteps": 370585881,
    "learntime": 0.2599348952062428,
    "sampletime": 8.72985365614295,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1052,
    "reward_mean": 2.7325689738166226,
    "reward_max": 4.1965270018812975,
    "reward_min": -14.451039432788754,
    "reward_std": 2.5130734389923055,
    "timesteps": 370945542,
    "learntime": 0.2700154180638492,
    "sampletime": 8.962327316170558,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1053,
    "reward_mean": 2.901635513919861,
    "reward_max": 4.01361882966673,
    "reward_min": 2.19598223277452,
    "reward_std": 0.334620236574277,
    "timesteps": 371306262,
    "learntime": 0.21180319413542747,
    "sampletime": 8.838206665124744,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1054,
    "reward_mean": 3.000330779081292,
    "reward_max": 4.197672472667883,
    "reward_min": 1.7569095699370563,
    "reward_std": 0.503660065566778,
    "timesteps": 371666982,
    "learntime": 0.20877288095653057,
    "sampletime": 8.733373370021582,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1055,
    "reward_mean": 3.220577702009755,
    "reward_max": 4.886230733737141,
    "reward_min": 2.2662437528682244,
    "reward_std": 0.5292237639999106,
    "timesteps": 372027702,
    "learntime": 0.2673018320929259,
    "sampletime": 8.809757891111076,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1056,
    "reward_mean": 2.3166865103670085,
    "reward_max": 4.5741171660783655,
    "reward_min": -7.329892460426149,
    "reward_std": 2.8618798203726064,
    "timesteps": 372387642,
    "learntime": 0.21851227385923266,
    "sampletime": 8.96299272403121,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1057,
    "reward_mean": 3.135988963404921,
    "reward_max": 4.083248245547468,
    "reward_min": 2.0412769322142434,
    "reward_std": 0.4125813944824039,
    "timesteps": 372748362,
    "learntime": 0.25378012494184077,
    "sampletime": 8.840540566015989,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1058,
    "reward_mean": 3.3537859557257343,
    "reward_max": 4.5056037895917616,
    "reward_min": 2.594334026555189,
    "reward_std": 0.41582016757412776,
    "timesteps": 373109082,
    "learntime": 0.20644935709424317,
    "sampletime": 8.755580576136708,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1059,
    "reward_mean": 2.649764925637688,
    "reward_max": 4.42798949223343,
    "reward_min": -5.836407587292012,
    "reward_std": 1.920503801907497,
    "timesteps": 373469343,
    "learntime": 0.2566721378825605,
    "sampletime": 8.869708816986531,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1060,
    "reward_mean": 2.6434180297033185,
    "reward_max": 4.746332084343792,
    "reward_min": -5.917015441495814,
    "reward_std": 2.5411582324343454,
    "timesteps": 373828473,
    "learntime": 0.20903850113973022,
    "sampletime": 8.918795798905194,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1061,
    "reward_mean": 2.869939254276476,
    "reward_max": 4.771482768973022,
    "reward_min": -5.884850210312641,
    "reward_std": 2.627390747229071,
    "timesteps": 374187759,
    "learntime": 0.2418838820885867,
    "sampletime": 8.83149540098384,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1062,
    "reward_mean": 2.761251463523833,
    "reward_max": 4.738524774084383,
    "reward_min": -5.851394647481908,
    "reward_std": 2.673032531430058,
    "timesteps": 374546406,
    "learntime": 0.21009555808268487,
    "sampletime": 8.652704895939678,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1063,
    "reward_mean": 3.3868008065952377,
    "reward_max": 4.994606160823924,
    "reward_min": -4.706934145193151,
    "reward_std": 1.8230835975248219,
    "timesteps": 374906151,
    "learntime": 0.26040288619697094,
    "sampletime": 8.73055007099174,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1064,
    "reward_mean": 3.96257663423362,
    "reward_max": 5.050467179419654,
    "reward_min": 2.5738442558089645,
    "reward_std": 0.58926366795136,
    "timesteps": 375266871,
    "learntime": 0.2110605901107192,
    "sampletime": 8.651351731969044,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1065,
    "reward_mean": 3.696438945003263,
    "reward_max": 5.734393046839003,
    "reward_min": -5.385844015937909,
    "reward_std": 2.019871069135891,
    "timesteps": 375626517,
    "learntime": 0.24597492697648704,
    "sampletime": 8.676146606914699,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1066,
    "reward_mean": 4.036469690410115,
    "reward_max": 5.650817338638287,
    "reward_min": 2.9132380018418176,
    "reward_std": 0.5893145614470945,
    "timesteps": 375987237,
    "learntime": 0.21296734013594687,
    "sampletime": 8.76062381803058,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1067,
    "reward_mean": 3.851856439897459,
    "reward_max": 6.07937364686619,
    "reward_min": -5.731642202812845,
    "reward_std": 2.0369605182840345,
    "timesteps": 376347405,
    "learntime": 0.2529790219850838,
    "sampletime": 8.716765604913235,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1068,
    "reward_mean": 3.3295742522170144,
    "reward_max": 5.690690144657207,
    "reward_min": -6.286036998590907,
    "reward_std": 2.818243448236162,
    "timesteps": 376707354,
    "learntime": 0.210536093916744,
    "sampletime": 8.782329040812328,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1069,
    "reward_mean": 2.5054124322636864,
    "reward_max": 5.957012204525222,
    "reward_min": -12.700721755122592,
    "reward_std": 3.820421383282092,
    "timesteps": 377065497,
    "learntime": 0.2604496341664344,
    "sampletime": 8.676019120030105,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1070,
    "reward_mean": 4.320101002408389,
    "reward_max": 5.870808734498549,
    "reward_min": 2.542624171787984,
    "reward_std": 0.65955089805491,
    "timesteps": 377426217,
    "learntime": 0.21484984713606536,
    "sampletime": 8.845369260990992,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1071,
    "reward_mean": 3.890393790379899,
    "reward_max": 6.046149480622262,
    "reward_min": -12.119809765940193,
    "reward_std": 3.011683859821801,
    "timesteps": 377785776,
    "learntime": 0.2759372121654451,
    "sampletime": 8.712970049818978,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1072,
    "reward_mean": 3.6355757977698904,
    "reward_max": 6.29996671049937,
    "reward_min": -12.501675994350633,
    "reward_std": 3.7212298164043403,
    "timesteps": 378144735,
    "learntime": 0.209190818015486,
    "sampletime": 8.841174629051238,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1073,
    "reward_mean": 4.392960804108138,
    "reward_max": 6.850933383416501,
    "reward_min": -3.8470193980381655,
    "reward_std": 1.806006897836774,
    "timesteps": 378505365,
    "learntime": 0.25124716898426414,
    "sampletime": 8.90963496803306,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1074,
    "reward_mean": 4.2255634373937525,
    "reward_max": 7.02553137261404,
    "reward_min": -4.581154276073601,
    "reward_std": 2.689998389259715,
    "timesteps": 378865686,
    "learntime": 0.22299301205202937,
    "sampletime": 8.93508738395758,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1075,
    "reward_mean": 3.2924277300831637,
    "reward_max": 6.322088691878663,
    "reward_min": -15.252987882027151,
    "reward_std": 4.021286373753388,
    "timesteps": 379223613,
    "learntime": 0.2701995170209557,
    "sampletime": 8.91348560503684,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1076,
    "reward_mean": 4.2961509734994445,
    "reward_max": 6.611100903401766,
    "reward_min": -4.37154962812466,
    "reward_std": 2.696343170334712,
    "timesteps": 379582746,
    "learntime": 0.21850907988846302,
    "sampletime": 8.870102104032412,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1077,
    "reward_mean": 3.578763379552748,
    "reward_max": 7.435235287172182,
    "reward_min": -10.104423468657645,
    "reward_std": 3.854100247755432,
    "timesteps": 379940067,
    "learntime": 0.2694791939575225,
    "sampletime": 8.877399572869763,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1078,
    "reward_mean": 4.948555880449208,
    "reward_max": 7.067911706696382,
    "reward_min": 3.458201618653467,
    "reward_std": 0.715519097306311,
    "timesteps": 380300787,
    "learntime": 0.2223165121395141,
    "sampletime": 8.811302280053496,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1079,
    "reward_mean": 2.8353840275758015,
    "reward_max": 6.701220383815877,
    "reward_min": -23.280775135340672,
    "reward_std": 4.745947264424725,
    "timesteps": 380659422,
    "learntime": 0.27424069796688855,
    "sampletime": 8.806586374994367,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1080,
    "reward_mean": 4.087171131632356,
    "reward_max": 6.837495602093191,
    "reward_min": -13.654351153283978,
    "reward_std": 3.9777705764508,
    "timesteps": 381018063,
    "learntime": 0.2110755278263241,
    "sampletime": 8.926801970927045,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1081,
    "reward_mean": 2.4994486181652724,
    "reward_max": 6.735919889046767,
    "reward_min": -22.830259136396993,
    "reward_std": 5.31154018877177,
    "timesteps": 381372348,
    "learntime": 0.2743673138320446,
    "sampletime": 8.75707811396569,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1082,
    "reward_mean": 3.935138309587161,
    "reward_max": 7.10341608931914,
    "reward_min": -5.555792215301404,
    "reward_std": 3.3676575795488404,
    "timesteps": 381731169,
    "learntime": 0.2061556470580399,
    "sampletime": 8.815295270876959,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1083,
    "reward_mean": 4.115183195922677,
    "reward_max": 7.126082304752231,
    "reward_min": -5.331788746767088,
    "reward_std": 3.175015363773509,
    "timesteps": 382090866,
    "learntime": 0.25453682988882065,
    "sampletime": 8.7884945939295,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1084,
    "reward_mean": 2.4582411632185996,
    "reward_max": 7.47740183370611,
    "reward_min": -21.76717359185304,
    "reward_std": 5.572046953034102,
    "timesteps": 382444836,
    "learntime": 0.20320371305570006,
    "sampletime": 8.791269300039858,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1085,
    "reward_mean": 2.044175277690994,
    "reward_max": 7.147370868856365,
    "reward_min": -12.600848431540449,
    "reward_std": 5.179671555849168,
    "timesteps": 382800282,
    "learntime": 0.21360140293836594,
    "sampletime": 8.573110469151288,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1086,
    "reward_mean": 3.183953577426333,
    "reward_max": 7.581600431165881,
    "reward_min": -21.483833589713683,
    "reward_std": 5.026270750736071,
    "timesteps": 383158428,
    "learntime": 0.2074733639601618,
    "sampletime": 8.63435319904238,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1087,
    "reward_mean": 2.9395281511633833,
    "reward_max": 7.3561168339100815,
    "reward_min": -13.42792840747103,
    "reward_std": 5.216297208598826,
    "timesteps": 383515599,
    "learntime": 0.21902291593141854,
    "sampletime": 8.835612462135032,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1088,
    "reward_mean": 2.3163099965781795,
    "reward_max": 6.766638774303082,
    "reward_min": -22.715385434796303,
    "reward_std": 5.051806592521334,
    "timesteps": 383872131,
    "learntime": 0.20985750178806484,
    "sampletime": 8.789078523870558,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1089,
    "reward_mean": 2.409378507398144,
    "reward_max": 6.632195014794377,
    "reward_min": -21.93772965212437,
    "reward_std": 5.6321535833713625,
    "timesteps": 384228765,
    "learntime": 0.21086747804656625,
    "sampletime": 8.669611129211262,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1090,
    "reward_mean": 4.252334652460909,
    "reward_max": 6.956277705510285,
    "reward_min": -4.983084515578499,
    "reward_std": 3.294768853275101,
    "timesteps": 384587073,
    "learntime": 0.2096001689787954,
    "sampletime": 8.810496194986627,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1091,
    "reward_mean": 4.141297660209769,
    "reward_max": 7.218715611916397,
    "reward_min": -3.9899849277660007,
    "reward_std": 3.0900864514582684,
    "timesteps": 384945534,
    "learntime": 0.21687584510073066,
    "sampletime": 8.822885908884928,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1092,
    "reward_mean": 4.228847817302968,
    "reward_max": 6.829360110180761,
    "reward_min": -4.5988708540945415,
    "reward_std": 3.0381866751488706,
    "timesteps": 385305828,
    "learntime": 0.215462117921561,
    "sampletime": 8.818261817097664,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1093,
    "reward_mean": 4.1531697722954535,
    "reward_max": 7.562282081294112,
    "reward_min": -12.191989422868481,
    "reward_std": 3.55102409357997,
    "timesteps": 385664751,
    "learntime": 0.2145115821622312,
    "sampletime": 8.799125033896416,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1094,
    "reward_mean": 3.752617789201829,
    "reward_max": 7.121001231868115,
    "reward_min": -13.921442722361963,
    "reward_std": 4.322673407265013,
    "timesteps": 386022399,
    "learntime": 0.21994533902034163,
    "sampletime": 8.819094644160941,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1095,
    "reward_mean": 2.5651872903528288,
    "reward_max": 6.867127752879039,
    "reward_min": -21.795389045738958,
    "reward_std": 5.543952968796617,
    "timesteps": 386378016,
    "learntime": 0.20252742408774793,
    "sampletime": 8.646773137152195,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1096,
    "reward_mean": 4.791891055002038,
    "reward_max": 7.599145946321896,
    "reward_min": -4.083359661515605,
    "reward_std": 2.717578745778338,
    "timesteps": 386737710,
    "learntime": 0.2172032380476594,
    "sampletime": 8.814788510091603,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1097,
    "reward_mean": 3.6545992887136007,
    "reward_max": 6.772170769989091,
    "reward_min": -4.505007632549461,
    "reward_std": 3.4529780842460895,
    "timesteps": 387096765,
    "learntime": 0.20721593988128006,
    "sampletime": 8.837149061029777,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1098,
    "reward_mean": 5.213947291996893,
    "reward_max": 7.253465849442304,
    "reward_min": -3.8219942503739315,
    "reward_std": 1.925917776584706,
    "timesteps": 387457209,
    "learntime": 0.21046146587468684,
    "sampletime": 8.79392243293114,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1099,
    "reward_mean": 4.011501149210067,
    "reward_max": 7.133738249204016,
    "reward_min": -13.956415167504355,
    "reward_std": 3.703256858003519,
    "timesteps": 387816255,
    "learntime": 0.21353450906462967,
    "sampletime": 8.79362595709972,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1100,
    "reward_mean": 4.11169408161665,
    "reward_max": 6.41028677308085,
    "reward_min": -4.9288891171966025,
    "reward_std": 2.691275282611539,
    "timesteps": 388175829,
    "learntime": 0.20851682499051094,
    "sampletime": 8.829182173125446,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1101,
    "reward_mean": 4.342262566317167,
    "reward_max": 6.675646786721089,
    "reward_min": -4.131464571569022,
    "reward_std": 2.5842723168480792,
    "timesteps": 388535124,
    "learntime": 0.2171684829518199,
    "sampletime": 8.809899308020249,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1102,
    "reward_mean": 3.6253181090626607,
    "reward_max": 7.352405997331842,
    "reward_min": -13.661245767947001,
    "reward_std": 3.909851113140628,
    "timesteps": 388894203,
    "learntime": 0.21625243197195232,
    "sampletime": 8.945867349859327,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1103,
    "reward_mean": 5.146516865153826,
    "reward_max": 6.763065430917778,
    "reward_min": 3.5932046108681557,
    "reward_std": 0.7625810714711494,
    "timesteps": 389254923,
    "learntime": 0.20928560802713037,
    "sampletime": 8.872144490946084,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1104,
    "reward_mean": 3.2872758963421416,
    "reward_max": 6.447506677846163,
    "reward_min": -13.647811842903279,
    "reward_std": 4.181939604361544,
    "timesteps": 389614875,
    "learntime": 0.2125160361174494,
    "sampletime": 8.793466908857226,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1105,
    "reward_mean": 4.661752132660643,
    "reward_max": 7.050862532380655,
    "reward_min": -14.10681419500686,
    "reward_std": 2.6442251075567405,
    "timesteps": 389975247,
    "learntime": 0.21578019694425166,
    "sampletime": 8.767318347934633,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1106,
    "reward_mean": 4.609233169434191,
    "reward_max": 6.392147650958079,
    "reward_min": -11.790135249230337,
    "reward_std": 2.4824999580776175,
    "timesteps": 390335634,
    "learntime": 0.20888550602830946,
    "sampletime": 9.003290199209005,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1107,
    "reward_mean": 4.999501918252582,
    "reward_max": 6.693332368334236,
    "reward_min": 3.3607122673808267,
    "reward_std": 0.6935033544267973,
    "timesteps": 390696354,
    "learntime": 0.20406413986347616,
    "sampletime": 8.72675570496358,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1108,
    "reward_mean": 4.538300184815047,
    "reward_max": 6.666979286375199,
    "reward_min": -5.018464759620135,
    "reward_std": 2.154199479305254,
    "timesteps": 391056372,
    "learntime": 0.21486356505192816,
    "sampletime": 8.650471756001934,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1109,
    "reward_mean": 4.815770508312196,
    "reward_max": 7.676124904606359,
    "reward_min": -4.929051195962755,
    "reward_std": 2.104020349132166,
    "timesteps": 391416675,
    "learntime": 0.21058092103339732,
    "sampletime": 8.82917349296622,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1110,
    "reward_mean": 4.213024506877106,
    "reward_max": 6.740864473281274,
    "reward_min": -5.127964319942601,
    "reward_std": 2.1927510313607317,
    "timesteps": 391777065,
    "learntime": 0.21381148812361062,
    "sampletime": 8.75253039994277,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1111,
    "reward_mean": 4.915927761358432,
    "reward_max": 6.46913718182071,
    "reward_min": 3.3401137142181025,
    "reward_std": 0.684058012045881,
    "timesteps": 392137785,
    "learntime": 0.21232728101313114,
    "sampletime": 8.747960281092674,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1112,
    "reward_mean": 4.340763265956044,
    "reward_max": 6.189091795565077,
    "reward_min": -4.6105663940397825,
    "reward_std": 1.942869377000847,
    "timesteps": 392497959,
    "learntime": 0.221853501861915,
    "sampletime": 8.581120043992996,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1113,
    "reward_mean": 5.02823992854807,
    "reward_max": 7.648595171825335,
    "reward_min": 3.4436864497238804,
    "reward_std": 0.8705873807679168,
    "timesteps": 392858679,
    "learntime": 0.2140769069083035,
    "sampletime": 8.71098662703298,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1114,
    "reward_mean": 4.983457934149817,
    "reward_max": 6.460147557653147,
    "reward_min": 3.3196923753253684,
    "reward_std": 0.6963830578860629,
    "timesteps": 393219399,
    "learntime": 0.21435539005324244,
    "sampletime": 8.76997759588994,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1115,
    "reward_mean": 5.077896162061153,
    "reward_max": 6.751125717997749,
    "reward_min": 3.3730556410713066,
    "reward_std": 0.7701935654080889,
    "timesteps": 393580119,
    "learntime": 0.20926957810297608,
    "sampletime": 8.836777914082631,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1116,
    "reward_mean": 4.383191507030507,
    "reward_max": 6.956684920016082,
    "reward_min": -4.976391169284895,
    "reward_std": 2.0134859063371153,
    "timesteps": 393940068,
    "learntime": 0.20486670010723174,
    "sampletime": 8.818363429047167,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1117,
    "reward_mean": 4.846834426594972,
    "reward_max": 6.528417585039276,
    "reward_min": 3.3933549962486267,
    "reward_std": 0.6745111596921093,
    "timesteps": 394300788,
    "learntime": 0.20809826906770468,
    "sampletime": 8.801122447941452,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1118,
    "reward_mean": 5.108551762387471,
    "reward_max": 6.754007272745098,
    "reward_min": 3.8298438574984717,
    "reward_std": 0.6352329999032094,
    "timesteps": 394661508,
    "learntime": 0.21565362787805498,
    "sampletime": 8.728741431143135,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1119,
    "reward_mean": 3.997432705732429,
    "reward_max": 7.0164486808723465,
    "reward_min": -14.458880402296382,
    "reward_std": 3.431951688226036,
    "timesteps": 395020773,
    "learntime": 0.21216084901243448,
    "sampletime": 8.836467797169462,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1120,
    "reward_mean": 4.48958695766398,
    "reward_max": 7.409709184847694,
    "reward_min": -11.623296409425771,
    "reward_std": 2.3751988807973174,
    "timesteps": 395380482,
    "learntime": 0.22191960783675313,
    "sampletime": 8.793695072177798,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1121,
    "reward_mean": 4.868555619820231,
    "reward_max": 6.708267750537768,
    "reward_min": -4.094947338457026,
    "reward_std": 1.919786165911548,
    "timesteps": 395740212,
    "learntime": 0.25870305486023426,
    "sampletime": 8.684865426039323,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1122,
    "reward_mean": 3.9473029850871817,
    "reward_max": 6.505342138687741,
    "reward_min": -4.950545231677646,
    "reward_std": 2.6517150295877725,
    "timesteps": 396099216,
    "learntime": 0.2111041839234531,
    "sampletime": 8.868234436959028,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1123,
    "reward_mean": 4.58888371960332,
    "reward_max": 6.651704245733773,
    "reward_min": -4.071559139192249,
    "reward_std": 1.9757066528927292,
    "timesteps": 396459777,
    "learntime": 0.2160725761204958,
    "sampletime": 8.965354442829266,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1124,
    "reward_mean": 5.177355931627758,
    "reward_max": 7.168805777024698,
    "reward_min": 3.545183143513206,
    "reward_std": 0.783319340198203,
    "timesteps": 396820497,
    "learntime": 0.25177780888043344,
    "sampletime": 8.931911461055279,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1125,
    "reward_mean": 4.510815359153721,
    "reward_max": 6.3288264588938725,
    "reward_min": -4.014793968203269,
    "reward_std": 1.8632479259573052,
    "timesteps": 397180539,
    "learntime": 0.2191727589815855,
    "sampletime": 8.76634722109884,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1126,
    "reward_mean": 4.534762655960632,
    "reward_max": 7.04504205051908,
    "reward_min": -3.8247560032824484,
    "reward_std": 1.885778607163793,
    "timesteps": 397540956,
    "learntime": 0.2656424611341208,
    "sampletime": 8.880553530994803,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1127,
    "reward_mean": 4.854302219098226,
    "reward_max": 6.630809932093445,
    "reward_min": 3.081884531138435,
    "reward_std": 0.8589611932791498,
    "timesteps": 397901676,
    "learntime": 0.21263682399876416,
    "sampletime": 8.934461052995175,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1128,
    "reward_mean": 4.701069682318359,
    "reward_max": 6.9360071658871725,
    "reward_min": -5.234780353099473,
    "reward_std": 2.198466299335629,
    "timesteps": 398261157,
    "learntime": 0.25229803612455726,
    "sampletime": 8.895059658912942,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1129,
    "reward_mean": 4.504607984575058,
    "reward_max": 6.8834329219887715,
    "reward_min": -4.3438518028071345,
    "reward_std": 2.692636761779414,
    "timesteps": 398620341,
    "learntime": 0.2209589439444244,
    "sampletime": 8.69037693599239,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1130,
    "reward_mean": 4.829026510724892,
    "reward_max": 7.208142210536713,
    "reward_min": -4.437535420332678,
    "reward_std": 1.9912314103003357,
    "timesteps": 398980011,
    "learntime": 0.2676683960016817,
    "sampletime": 8.86373388278298,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1131,
    "reward_mean": 4.823235429703103,
    "reward_max": 7.054280901352419,
    "reward_min": -5.079510230105374,
    "reward_std": 2.0454478478216056,
    "timesteps": 399340650,
    "learntime": 0.21364722098223865,
    "sampletime": 8.782608109991997,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1132,
    "reward_mean": 4.467947668155304,
    "reward_max": 6.5693935568730595,
    "reward_min": -4.922843562289381,
    "reward_std": 2.724592596010658,
    "timesteps": 399699186,
    "learntime": 0.24923656694591045,
    "sampletime": 8.708696888992563,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1133,
    "reward_mean": 5.482285276525751,
    "reward_max": 7.495115652180778,
    "reward_min": 3.788938358669505,
    "reward_std": 0.7593198483464355,
    "timesteps": 400059906,
    "learntime": 0.2153571827802807,
    "sampletime": 8.827654711902142,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1134,
    "reward_mean": 4.929139623127556,
    "reward_max": 7.379428889508054,
    "reward_min": -3.5550850008236923,
    "reward_std": 1.9390694895983254,
    "timesteps": 400419534,
    "learntime": 0.2701604769099504,
    "sampletime": 8.789570410968736,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1135,
    "reward_mean": 5.713575512428041,
    "reward_max": 7.538559582685894,
    "reward_min": 4.029008434408971,
    "reward_std": 0.8380208780508888,
    "timesteps": 400780254,
    "learntime": 0.2102561912033707,
    "sampletime": 8.82485022698529,
    "best_max_mean": -0.1261346636593036,
    "best_max": 7.682765036567367
  },
  {
    "gen": 1136,
    "reward_mean": 5.053212917816897,
    "reward_max": 7.814232334217661,
    "reward_min": -3.958682480736933,
    "reward_std": 2.0805369536167087,
    "timesteps": 401140038,
    "learntime": 0.2869955659843981,
    "sampletime": 8.755544673884287,
    "best_max_mean": 5.053212917816897,
    "best_max": 7.814232334217661
  },
  {
    "gen": 1137,
    "reward_mean": 4.5198553579404575,
    "reward_max": 7.4957267078800305,
    "reward_min": -5.7442213988447985,
    "reward_std": 2.8399987387799945,
    "timesteps": 401499693,
    "learntime": 0.2351975878700614,
    "sampletime": 8.866736431140453,
    "best_max_mean": 5.053212917816897,
    "best_max": 7.814232334217661
  },
  {
    "gen": 1138,
    "reward_mean": 5.320141770885867,
    "reward_max": 8.078238456224257,
    "reward_min": -4.59390936990773,
    "reward_std": 2.1148212800330763,
    "timesteps": 401860242,
    "learntime": 0.2507204730063677,
    "sampletime": 8.741037799045444,
    "best_max_mean": 5.320141770885867,
    "best_max": 8.078238456224257
  },
  {
    "gen": 1139,
    "reward_mean": 5.929400370321645,
    "reward_max": 8.48888685303664,
    "reward_min": 4.308429475686149,
    "reward_std": 0.7416311904052653,
    "timesteps": 402220962,
    "learntime": 0.22930793603882194,
    "sampletime": 8.739320916123688,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1140,
    "reward_mean": 5.551037223230713,
    "reward_max": 7.813403174898474,
    "reward_min": -3.9222922005000984,
    "reward_std": 2.1689148725179535,
    "timesteps": 402581493,
    "learntime": 0.2586936999578029,
    "sampletime": 8.878648587036878,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1141,
    "reward_mean": 4.801972033146255,
    "reward_max": 7.5964622754901105,
    "reward_min": -12.42925660400722,
    "reward_std": 3.161144913991383,
    "timesteps": 402940653,
    "learntime": 0.21790281310677528,
    "sampletime": 8.655824742047116,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1142,
    "reward_mean": 4.875615328511106,
    "reward_max": 7.592201686037391,
    "reward_min": -4.257087624538339,
    "reward_std": 2.795114261685438,
    "timesteps": 403299111,
    "learntime": 0.2479993721935898,
    "sampletime": 8.82076293695718,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1143,
    "reward_mean": 5.222903500791548,
    "reward_max": 7.58816468022349,
    "reward_min": -4.91223147055699,
    "reward_std": 2.2334948770524807,
    "timesteps": 403658685,
    "learntime": 0.21201055706478655,
    "sampletime": 8.857155930949375,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1144,
    "reward_mean": 3.8297101921761847,
    "reward_max": 7.971726068722391,
    "reward_min": -21.331640355130236,
    "reward_std": 4.8789280554126755,
    "timesteps": 404016711,
    "learntime": 0.25131580187007785,
    "sampletime": 8.71928232209757,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1145,
    "reward_mean": 3.4571182220425176,
    "reward_max": 7.2955959756659325,
    "reward_min": -19.375303160303954,
    "reward_std": 5.095929722595529,
    "timesteps": 404372004,
    "learntime": 0.21274259220808744,
    "sampletime": 8.728188161971048,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1146,
    "reward_mean": 5.523049188091813,
    "reward_max": 7.868069954675087,
    "reward_min": -3.721781227455448,
    "reward_std": 2.051232356565168,
    "timesteps": 404731740,
    "learntime": 0.2601913218386471,
    "sampletime": 8.860474758083,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1147,
    "reward_mean": 3.578422776035719,
    "reward_max": 7.417908329334967,
    "reward_min": -13.305800760425905,
    "reward_std": 4.919102194424725,
    "timesteps": 405088398,
    "learntime": 0.21129463193938136,
    "sampletime": 8.703241566894576,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1148,
    "reward_mean": 4.583292819488969,
    "reward_max": 7.624943453540086,
    "reward_min": -10.074955741839503,
    "reward_std": 3.303605606584819,
    "timesteps": 405446943,
    "learntime": 0.2795484790112823,
    "sampletime": 8.830477627925575,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1149,
    "reward_mean": 3.500543869968598,
    "reward_max": 7.880968986981313,
    "reward_min": -23.05770897324053,
    "reward_std": 5.334664822697448,
    "timesteps": 405805113,
    "learntime": 0.21158748189918697,
    "sampletime": 8.754708555992693,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1150,
    "reward_mean": 4.808836306611332,
    "reward_max": 7.020564243758352,
    "reward_min": -3.6235842258090902,
    "reward_std": 2.6245845635881464,
    "timesteps": 406164522,
    "learntime": 0.24860973889008164,
    "sampletime": 8.78065290604718,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1151,
    "reward_mean": 3.9163333633969417,
    "reward_max": 7.608666398093302,
    "reward_min": -12.998186599856565,
    "reward_std": 4.162186996637356,
    "timesteps": 406522521,
    "learntime": 0.21796678402461112,
    "sampletime": 8.756164391059428,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1152,
    "reward_mean": 5.503753845632316,
    "reward_max": 7.91834349490657,
    "reward_min": -3.3087806291931154,
    "reward_std": 1.9153619615860418,
    "timesteps": 406882206,
    "learntime": 0.24453474581241608,
    "sampletime": 8.906782880891114,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1153,
    "reward_mean": 2.520360672344805,
    "reward_max": 7.957732642402825,
    "reward_min": -12.881455922229433,
    "reward_std": 5.158894565644364,
    "timesteps": 407235228,
    "learntime": 0.21410176600329578,
    "sampletime": 8.717193817021325,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1154,
    "reward_mean": 4.592106951223705,
    "reward_max": 7.579530635531143,
    "reward_min": -12.313906311004759,
    "reward_std": 3.8719400607905237,
    "timesteps": 407594106,
    "learntime": 0.2522976470645517,
    "sampletime": 8.980817948002368,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1155,
    "reward_mean": 4.456412469821569,
    "reward_max": 7.4723934282673925,
    "reward_min": -4.720450405726409,
    "reward_std": 3.2574520132988116,
    "timesteps": 407952558,
    "learntime": 0.22395775583572686,
    "sampletime": 8.802504843100905,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1156,
    "reward_mean": 4.721935599061924,
    "reward_max": 8.35000130439099,
    "reward_min": -13.434668923241349,
    "reward_std": 3.79301566968999,
    "timesteps": 408311814,
    "learntime": 0.2225374390836805,
    "sampletime": 8.703311534132808,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1157,
    "reward_mean": 5.505661269161127,
    "reward_max": 7.355219146527408,
    "reward_min": -3.6823457738994936,
    "reward_std": 1.9994100690232932,
    "timesteps": 408671403,
    "learntime": 0.2156975029502064,
    "sampletime": 8.59746197401546,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1158,
    "reward_mean": 5.020589578275377,
    "reward_max": 7.725570042878667,
    "reward_min": -4.754648547471416,
    "reward_std": 2.7404299090129296,
    "timesteps": 409030113,
    "learntime": 0.27308464888483286,
    "sampletime": 8.736534838099033,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1159,
    "reward_mean": 2.7168910810862124,
    "reward_max": 7.988996316368378,
    "reward_min": -13.144101848748203,
    "reward_std": 5.4897666056004635,
    "timesteps": 409385727,
    "learntime": 0.24436973594129086,
    "sampletime": 8.746767978183925,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1160,
    "reward_mean": 4.384549589461999,
    "reward_max": 7.244780389909548,
    "reward_min": -12.18831573063543,
    "reward_std": 3.7945925312848945,
    "timesteps": 409743291,
    "learntime": 0.21023909910582006,
    "sampletime": 8.786824424983934,
    "best_max_mean": 5.929400370321645,
    "best_max": 8.48888685303664
  },
  {
    "gen": 1161,
    "reward_mean": 4.778841603257215,
    "reward_max": 8.933576528949546,
    "reward_min": -12.968886610219313,
    "reward_std": 3.6953866604624444,
    "timesteps": 410100537,
    "learntime": 0.21356638008728623,
    "sampletime": 8.854914183961228,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1162,
    "reward_mean": 5.105110096141771,
    "reward_max": 8.57808350376294,
    "reward_min": -4.274509582373979,
    "reward_std": 2.7158681337985424,
    "timesteps": 410459223,
    "learntime": 0.22979561192914844,
    "sampletime": 8.766095196129754,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1163,
    "reward_mean": 4.245662817758144,
    "reward_max": 8.056531281457422,
    "reward_min": -12.466473112587915,
    "reward_std": 5.050157397032748,
    "timesteps": 410814690,
    "learntime": 0.23780342587269843,
    "sampletime": 8.812540732091293,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1164,
    "reward_mean": 4.768924217111863,
    "reward_max": 7.783437262137971,
    "reward_min": -12.334969554148056,
    "reward_std": 3.052503882871041,
    "timesteps": 411174153,
    "learntime": 0.21152934711426497,
    "sampletime": 8.647929872153327,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1165,
    "reward_mean": 5.244618313061893,
    "reward_max": 8.038147623855108,
    "reward_min": -3.0060543584263466,
    "reward_std": 2.578655614136341,
    "timesteps": 411532887,
    "learntime": 0.2068421421572566,
    "sampletime": 8.851160123944283,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1166,
    "reward_mean": 4.600253628509604,
    "reward_max": 8.129963544747701,
    "reward_min": -5.0029650976895494,
    "reward_std": 3.2841779480125424,
    "timesteps": 411890763,
    "learntime": 0.21745923394337296,
    "sampletime": 8.78814860386774,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1167,
    "reward_mean": 4.7452614042756025,
    "reward_max": 7.498054161272716,
    "reward_min": -4.741285387186734,
    "reward_std": 2.9096179040157466,
    "timesteps": 412249233,
    "learntime": 0.2171050941105932,
    "sampletime": 8.797773800091818,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1168,
    "reward_mean": 4.774481756657082,
    "reward_max": 7.630274890562177,
    "reward_min": -3.9536790164878997,
    "reward_std": 2.7539381301909907,
    "timesteps": 412607793,
    "learntime": 0.22148939687758684,
    "sampletime": 8.943471080157906,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1169,
    "reward_mean": 5.207064284954887,
    "reward_max": 8.199118068840379,
    "reward_min": -4.643933020158195,
    "reward_std": 2.7455464630872526,
    "timesteps": 412966392,
    "learntime": 0.21251382096670568,
    "sampletime": 8.755890782224014,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1170,
    "reward_mean": 5.485447404538526,
    "reward_max": 7.91828755149838,
    "reward_min": -3.7798993278958033,
    "reward_std": 2.0874713925650283,
    "timesteps": 413326062,
    "learntime": 0.21366276103071868,
    "sampletime": 8.776968962047249,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1171,
    "reward_mean": 4.447587200901756,
    "reward_max": 8.349589829382515,
    "reward_min": -12.285263134773816,
    "reward_std": 3.9802603222950372,
    "timesteps": 413682246,
    "learntime": 0.21309912600554526,
    "sampletime": 8.744288366055116,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1172,
    "reward_mean": 5.7136783870866985,
    "reward_max": 8.027171359443331,
    "reward_min": -11.542314614440935,
    "reward_std": 2.5183075754945663,
    "timesteps": 414042117,
    "learntime": 0.21329785999841988,
    "sampletime": 8.826542861992493,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1173,
    "reward_mean": 5.864222564530938,
    "reward_max": 7.628368927222303,
    "reward_min": 4.280164620340851,
    "reward_std": 0.7528743422368933,
    "timesteps": 414402837,
    "learntime": 0.23026807303540409,
    "sampletime": 8.859719429863617,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1174,
    "reward_mean": 4.481814584297576,
    "reward_max": 7.717606425904017,
    "reward_min": -4.636228624784222,
    "reward_std": 3.3179156968944707,
    "timesteps": 414760494,
    "learntime": 0.20709598390385509,
    "sampletime": 8.670687850099057,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1175,
    "reward_mean": 5.156345907398579,
    "reward_max": 8.356508361658955,
    "reward_min": -3.8312425041133853,
    "reward_std": 2.0865582727784635,
    "timesteps": 415120173,
    "learntime": 0.21841582795605063,
    "sampletime": 8.751978491898626,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1176,
    "reward_mean": 5.594573224716807,
    "reward_max": 8.05919711235699,
    "reward_min": -3.751687215608806,
    "reward_std": 1.9352255874840791,
    "timesteps": 415479945,
    "learntime": 0.22028318606317043,
    "sampletime": 8.825629881117493,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1177,
    "reward_mean": 5.574860140727498,
    "reward_max": 7.180031648004482,
    "reward_min": 3.919022938853945,
    "reward_std": 0.6552714910339239,
    "timesteps": 415840665,
    "learntime": 0.22941294917836785,
    "sampletime": 8.869108335115016,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1178,
    "reward_mean": 4.191853555255005,
    "reward_max": 7.453209057900076,
    "reward_min": -4.541564800074524,
    "reward_std": 3.3776218333013226,
    "timesteps": 416198223,
    "learntime": 0.2172112138941884,
    "sampletime": 8.683959990972653,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1179,
    "reward_mean": 3.9199807767250916,
    "reward_max": 7.164755695704088,
    "reward_min": -19.277850260845103,
    "reward_std": 4.202477993436212,
    "timesteps": 416554971,
    "learntime": 0.21846392005681992,
    "sampletime": 8.716943994862959,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1180,
    "reward_mean": 5.457643891800603,
    "reward_max": 8.387994924176551,
    "reward_min": -12.488008028817024,
    "reward_std": 2.6390832987655903,
    "timesteps": 416914539,
    "learntime": 0.2238339320756495,
    "sampletime": 8.903744611889124,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1181,
    "reward_mean": 5.221564931763956,
    "reward_max": 7.4433286993192835,
    "reward_min": -4.437612181655522,
    "reward_std": 2.024616551660015,
    "timesteps": 417274344,
    "learntime": 0.22205784218385816,
    "sampletime": 8.818477049004287,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1182,
    "reward_mean": 4.6975432326701,
    "reward_max": 7.423750955177553,
    "reward_min": -22.562834255616043,
    "reward_std": 4.363882098097813,
    "timesteps": 417631869,
    "learntime": 0.21255336795002222,
    "sampletime": 8.898733315989375,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1183,
    "reward_mean": 4.88277240017309,
    "reward_max": 7.715726973817885,
    "reward_min": -4.1432367292948085,
    "reward_std": 2.747439279617988,
    "timesteps": 417990648,
    "learntime": 0.228414470795542,
    "sampletime": 8.793156744912267,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1184,
    "reward_mean": 5.2288986414699625,
    "reward_max": 8.19117189140701,
    "reward_min": -3.2766316425933706,
    "reward_std": 1.986556465285703,
    "timesteps": 418350285,
    "learntime": 0.21787996194325387,
    "sampletime": 8.808578302152455,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1185,
    "reward_mean": 5.194554424530136,
    "reward_max": 7.93049940422431,
    "reward_min": -4.01254618453095,
    "reward_std": 2.0326204027975554,
    "timesteps": 418709829,
    "learntime": 0.21040264796465635,
    "sampletime": 8.867033974034712,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1186,
    "reward_mean": 5.59093466024916,
    "reward_max": 7.930372417199766,
    "reward_min": 3.09867966975111,
    "reward_std": 0.9220348250067024,
    "timesteps": 419070549,
    "learntime": 0.20936081395484507,
    "sampletime": 8.859080805908889,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1187,
    "reward_mean": 5.778576604547679,
    "reward_max": 7.6062646265067535,
    "reward_min": 2.640530451525452,
    "reward_std": 0.9241919940095327,
    "timesteps": 419431269,
    "learntime": 0.21407954511232674,
    "sampletime": 8.770341145107523,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1188,
    "reward_mean": 5.478629706098892,
    "reward_max": 7.502514860733888,
    "reward_min": -3.626579426283684,
    "reward_std": 2.0107465146753216,
    "timesteps": 419790882,
    "learntime": 0.22255586204119027,
    "sampletime": 8.780198449036106,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1189,
    "reward_mean": 5.761433924791925,
    "reward_max": 8.012197553587608,
    "reward_min": 3.6761900160183534,
    "reward_std": 0.858041092561143,
    "timesteps": 420151602,
    "learntime": 0.2146435792092234,
    "sampletime": 8.888186816126108,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1190,
    "reward_mean": 4.652413244007624,
    "reward_max": 7.7579558122846635,
    "reward_min": -3.6210266444902626,
    "reward_std": 3.1828059531423456,
    "timesteps": 420509652,
    "learntime": 0.2171563389711082,
    "sampletime": 8.90834356797859,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1191,
    "reward_mean": 5.672250683195912,
    "reward_max": 8.226229060222096,
    "reward_min": 3.678324287406412,
    "reward_std": 0.8120592182227687,
    "timesteps": 420870372,
    "learntime": 0.2088837579358369,
    "sampletime": 8.793240250088274,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1192,
    "reward_mean": 5.4196501419801555,
    "reward_max": 7.714136534765587,
    "reward_min": -4.304840265622429,
    "reward_std": 2.152579256642157,
    "timesteps": 421229943,
    "learntime": 0.2571167000569403,
    "sampletime": 8.797003287123516,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1193,
    "reward_mean": 6.272792343515216,
    "reward_max": 8.377633504788246,
    "reward_min": 4.291007985332699,
    "reward_std": 0.8245812215500201,
    "timesteps": 421590663,
    "learntime": 0.26426310115493834,
    "sampletime": 8.763092248002067,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1194,
    "reward_mean": 5.914491638168786,
    "reward_max": 7.640246730770516,
    "reward_min": 4.074068125832124,
    "reward_std": 0.8004758459906318,
    "timesteps": 421951383,
    "learntime": 0.21973144100047648,
    "sampletime": 8.835860203951597,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1195,
    "reward_mean": 5.6389803347949945,
    "reward_max": 8.036484807468666,
    "reward_min": -3.280247460130013,
    "reward_std": 2.0347331260341917,
    "timesteps": 422311005,
    "learntime": 0.2252562679350376,
    "sampletime": 8.819280290976167,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1196,
    "reward_mean": 5.13746073531277,
    "reward_max": 7.697934683423778,
    "reward_min": -5.050200725435639,
    "reward_std": 2.9390590522521807,
    "timesteps": 422669799,
    "learntime": 0.2707619199063629,
    "sampletime": 8.851792372995988,
    "best_max_mean": 4.778841603257215,
    "best_max": 8.933576528949546
  },
  {
    "gen": 1197,
    "reward_mean": 5.889387478009102,
    "reward_max": 9.331144762518603,
    "reward_min": -4.014801184744132,
    "reward_std": 2.1118254720797602,
    "timesteps": 423029541,
    "learntime": 0.22098257602192461,
    "sampletime": 8.789636973990127,
    "best_max_mean": 5.889387478009102,
    "best_max": 9.331144762518603
  },
  {
    "gen": 1198,
    "reward_mean": 6.671526063676533,
    "reward_max": 9.96469847913712,
    "reward_min": 4.871608965305817,
    "reward_std": 0.9973709136599568,
    "timesteps": 423390261,
    "learntime": 0.2707360570784658,
    "sampletime": 8.794786576880142,
    "best_max_mean": 6.671526063676533,
    "best_max": 9.96469847913712
  },
  {
    "gen": 1199,
    "reward_mean": 6.541654306675046,
    "reward_max": 9.031911899720196,
    "reward_min": -2.4073470323470034,
    "reward_std": 2.1265231833988962,
    "timesteps": 423750507,
    "learntime": 0.2245238700415939,
    "sampletime": 8.889993282034993,
    "best_max_mean": 6.671526063676533,
    "best_max": 9.96469847913712
  },
  {
    "gen": 1200,
    "reward_mean": 7.09018450416663,
    "reward_max": 9.266992764051816,
    "reward_min": 5.167580809361283,
    "reward_std": 0.9300547738252515,
    "timesteps": 424111227,
    "learntime": 0.26186677790246904,
    "sampletime": 8.882287885993719,
    "best_max_mean": 6.671526063676533,
    "best_max": 9.96469847913712
  },
  {
    "gen": 1201,
    "reward_mean": 5.713915405157359,
    "reward_max": 9.558216002436685,
    "reward_min": -11.642317407708049,
    "reward_std": 3.700014175208206,
    "timesteps": 424468686,
    "learntime": 0.12097606994211674,
    "sampletime": 8.707968299044296,
    "best_max_mean": 6.671526063676533,
    "best_max": 9.96469847913712
  },
  {
    "gen": 1202,
    "reward_mean": 5.50086965739426,
    "reward_max": 9.48126994128423,
    "reward_min": -22.24352534671286,
    "reward_std": 4.955731613523878,
    "timesteps": 424826052,
    "learntime": 0.2698524999432266,
    "sampletime": 8.809697247110307,
    "best_max_mean": 6.671526063676533,
    "best_max": 9.96469847913712
  },
  {
    "gen": 1203,
    "reward_mean": 5.908377353820081,
    "reward_max": 10.08029807145375,
    "reward_min": -7.851964556236958,
    "reward_std": 3.7569279552451667,
    "timesteps": 425182848,
    "learntime": 0.2185633690096438,
    "sampletime": 8.738987371092662,
    "best_max_mean": 5.908377353820081,
    "best_max": 10.08029807145375
  },
  {
    "gen": 1204,
    "reward_mean": 7.363690229895711,
    "reward_max": 10.285054057808308,
    "reward_min": -3.106465122307066,
    "reward_std": 2.24693343653252,
    "timesteps": 425542908,
    "learntime": 0.27391363005153835,
    "sampletime": 8.868857498979196,
    "best_max_mean": 7.363690229895711,
    "best_max": 10.285054057808308
  },
  {
    "gen": 1205,
    "reward_mean": 7.118319231819562,
    "reward_max": 10.605337696456855,
    "reward_min": -10.93593882204203,
    "reward_std": 3.390271458791966,
    "timesteps": 425901207,
    "learntime": 0.21253199689090252,
    "sampletime": 8.739246012177318,
    "best_max_mean": 7.118319231819562,
    "best_max": 10.605337696456855
  },
  {
    "gen": 1206,
    "reward_mean": 7.260445294851586,
    "reward_max": 12.59933287675746,
    "reward_min": -2.3915227767852683,
    "reward_std": 3.0240684112766685,
    "timesteps": 426261321,
    "learntime": 0.27605636697262526,
    "sampletime": 8.809161914978176,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1207,
    "reward_mean": 5.500907236867741,
    "reward_max": 10.812795762430383,
    "reward_min": -15.929801647337124,
    "reward_std": 5.251330455728583,
    "timesteps": 426617478,
    "learntime": 0.22530214698053896,
    "sampletime": 8.827169606927782,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1208,
    "reward_mean": 6.100071618660775,
    "reward_max": 12.41409138054763,
    "reward_min": -16.17163740925378,
    "reward_std": 5.29202442770537,
    "timesteps": 426974286,
    "learntime": 0.27111413003876805,
    "sampletime": 8.76794243697077,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1209,
    "reward_mean": 7.494082141698936,
    "reward_max": 11.724371893767966,
    "reward_min": -2.1062233998990543,
    "reward_std": 3.443501505668061,
    "timesteps": 427332093,
    "learntime": 0.2148855021223426,
    "sampletime": 8.768613393884152,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1210,
    "reward_mean": 7.019037328487052,
    "reward_max": 11.405449223563524,
    "reward_min": -10.67396660285092,
    "reward_std": 4.421796555781827,
    "timesteps": 427688832,
    "learntime": 0.2865462121553719,
    "sampletime": 8.974625513888896,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1211,
    "reward_mean": 4.7756079284198885,
    "reward_max": 12.313244689449533,
    "reward_min": -31.119091836333006,
    "reward_std": 7.343595225662862,
    "timesteps": 428039154,
    "learntime": 0.21450153295882046,
    "sampletime": 9.04460405302234,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1212,
    "reward_mean": 2.7274655808170634,
    "reward_max": 11.668198509815598,
    "reward_min": -29.0271752733194,
    "reward_std": 9.622303411459374,
    "timesteps": 428385702,
    "learntime": 0.2500865950714797,
    "sampletime": 8.545508892973885,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1213,
    "reward_mean": 6.064440830173776,
    "reward_max": 11.796737746857671,
    "reward_min": -15.806357088304745,
    "reward_std": 5.693162268264705,
    "timesteps": 428740578,
    "learntime": 0.2305951970629394,
    "sampletime": 8.75223983102478,
    "best_max_mean": 7.260445294851586,
    "best_max": 12.59933287675746
  },
  {
    "gen": 1214,
    "reward_mean": 6.405279943473026,
    "reward_max": 13.405252633164775,
    "reward_min": -24.244200307377877,
    "reward_std": 6.600755871021771,
    "timesteps": 429094197,
    "learntime": 0.21660250308923423,
    "sampletime": 8.655087036080658,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1215,
    "reward_mean": 0.09171639235157358,
    "reward_max": 12.892326872374252,
    "reward_min": -36.51848137326835,
    "reward_std": 12.11743298635224,
    "timesteps": 429435990,
    "learntime": 0.2184344339184463,
    "sampletime": 8.66201317217201,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1216,
    "reward_mean": 3.950836090703869,
    "reward_max": 13.396896843659112,
    "reward_min": -37.89998322883691,
    "reward_std": 9.030154780168761,
    "timesteps": 429786555,
    "learntime": 0.21697564702481031,
    "sampletime": 8.74067411897704,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1217,
    "reward_mean": 3.199662833687383,
    "reward_max": 13.187005990152507,
    "reward_min": -18.116106872065842,
    "reward_std": 8.225291573724991,
    "timesteps": 430132734,
    "learntime": 0.21388262999244034,
    "sampletime": 8.516721178079024,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1218,
    "reward_mean": 7.921411124888962,
    "reward_max": 13.206489001903469,
    "reward_min": -16.773504886691548,
    "reward_std": 5.5112962552767035,
    "timesteps": 430489494,
    "learntime": 0.21956575312651694,
    "sampletime": 8.791661218972877,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1219,
    "reward_mean": 8.036233887825446,
    "reward_max": 12.155808036532507,
    "reward_min": -7.7215909790446124,
    "reward_std": 3.7679848736036314,
    "timesteps": 430846905,
    "learntime": 0.2627718630246818,
    "sampletime": 8.875148036982864,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1220,
    "reward_mean": 8.556176169184727,
    "reward_max": 12.681612739790138,
    "reward_min": -1.0718046375545938,
    "reward_std": 2.154139675936615,
    "timesteps": 431206536,
    "learntime": 0.22063432005234063,
    "sampletime": 8.760753900045529,
    "best_max_mean": 6.405279943473026,
    "best_max": 13.405252633164775
  },
  {
    "gen": 1221,
    "reward_mean": 7.629792806178919,
    "reward_max": 14.047149039099384,
    "reward_min": -11.573527179028718,
    "reward_std": 5.397638492820855,
    "timesteps": 431562360,
    "learntime": 0.26416387991048396,
    "sampletime": 8.720060121966526,
    "best_max_mean": 7.629792806178919,
    "best_max": 14.047149039099384
  },
  {
    "gen": 1222,
    "reward_mean": 3.448075840310378,
    "reward_max": 12.335632944465472,
    "reward_min": -37.1159150575845,
    "reward_std": 8.728380129675491,
    "timesteps": 431913858,
    "learntime": 0.21685770200565457,
    "sampletime": 8.728133795782924,
    "best_max_mean": 7.629792806178919,
    "best_max": 14.047149039099384
  },
  {
    "gen": 1223,
    "reward_mean": 8.014507342809758,
    "reward_max": 14.156212517037403,
    "reward_min": -10.233233177357098,
    "reward_std": 4.320013377649953,
    "timesteps": 432270237,
    "learntime": 0.25738081708550453,
    "sampletime": 8.736579792108387,
    "best_max_mean": 8.014507342809758,
    "best_max": 14.156212517037403
  },
  {
    "gen": 1224,
    "reward_mean": 9.605748384559073,
    "reward_max": 13.009903749519829,
    "reward_min": -0.827624303325798,
    "reward_std": 2.4299887021842803,
    "timesteps": 432629898,
    "learntime": 0.2159011480398476,
    "sampletime": 8.857646936085075,
    "best_max_mean": 8.014507342809758,
    "best_max": 14.156212517037403
  },
  {
    "gen": 1225,
    "reward_mean": 8.104495303503628,
    "reward_max": 15.684000579202829,
    "reward_min": -7.827475410575672,
    "reward_std": 4.004958424341848,
    "timesteps": 432987300,
    "learntime": 0.25508559006266296,
    "sampletime": 8.867101513082162,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1226,
    "reward_mean": 8.573051402552068,
    "reward_max": 13.235386423022254,
    "reward_min": -1.6914176969880728,
    "reward_std": 2.5691272769982683,
    "timesteps": 433346694,
    "learntime": 0.23410322004929185,
    "sampletime": 8.777107377070934,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1227,
    "reward_mean": 6.995749511933227,
    "reward_max": 12.254566476295809,
    "reward_min": -9.44953178384458,
    "reward_std": 4.236873873887629,
    "timesteps": 433702569,
    "learntime": 0.2611469419207424,
    "sampletime": 8.771322797052562,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1228,
    "reward_mean": 8.661733423159685,
    "reward_max": 14.086104854712064,
    "reward_min": -2.1657130237047912,
    "reward_std": 3.02421094578813,
    "timesteps": 434061210,
    "learntime": 0.2215232690796256,
    "sampletime": 8.957220691023394,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1229,
    "reward_mean": 9.421590618482828,
    "reward_max": 13.154432164893613,
    "reward_min": 6.692957439551578,
    "reward_std": 1.3334811125345953,
    "timesteps": 434421930,
    "learntime": 0.2600777889601886,
    "sampletime": 8.838732762960717,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1230,
    "reward_mean": 8.818784286843737,
    "reward_max": 11.470573871375311,
    "reward_min": -11.58659636448614,
    "reward_std": 3.0834690959873114,
    "timesteps": 434781303,
    "learntime": 0.22729752492159605,
    "sampletime": 8.831516922917217,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1231,
    "reward_mean": 9.31476087818155,
    "reward_max": 12.662530343757345,
    "reward_min": -1.3515233014089378,
    "reward_std": 2.4759505057896956,
    "timesteps": 435140811,
    "learntime": 0.25739789893850684,
    "sampletime": 8.855954584199935,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1232,
    "reward_mean": 8.22973088742608,
    "reward_max": 11.79189201800689,
    "reward_min": -1.1570981940550888,
    "reward_std": 2.4735591443680884,
    "timesteps": 435500538,
    "learntime": 0.21685421583242714,
    "sampletime": 8.744814760051668,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1233,
    "reward_mean": 9.528464259256548,
    "reward_max": 13.539244225046579,
    "reward_min": -0.9250277329913591,
    "reward_std": 2.4933276570340355,
    "timesteps": 435859971,
    "learntime": 0.2702996297739446,
    "sampletime": 8.863664228934795,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1234,
    "reward_mean": 9.518985616087422,
    "reward_max": 13.470084999109416,
    "reward_min": 1.5718790537847036,
    "reward_std": 2.177092314824406,
    "timesteps": 436219506,
    "learntime": 0.2179873848799616,
    "sampletime": 8.861468833871186,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1235,
    "reward_mean": 9.615166133858477,
    "reward_max": 15.127887316910671,
    "reward_min": -1.9244385183247383,
    "reward_std": 3.2030006206931185,
    "timesteps": 436577766,
    "learntime": 0.2565764698665589,
    "sampletime": 8.808687516022474,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1236,
    "reward_mean": 9.695444530865144,
    "reward_max": 14.932384297638206,
    "reward_min": -0.9214911281268396,
    "reward_std": 2.5508353858390755,
    "timesteps": 436937358,
    "learntime": 0.21568636689335108,
    "sampletime": 8.820263971108943,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1237,
    "reward_mean": 9.390909958695433,
    "reward_max": 15.041659144647628,
    "reward_min": -1.39938771916941,
    "reward_std": 3.6859254278099898,
    "timesteps": 437295759,
    "learntime": 0.26333969295956194,
    "sampletime": 8.872497834032401,
    "best_max_mean": 8.104495303503628,
    "best_max": 15.684000579202829
  },
  {
    "gen": 1238,
    "reward_mean": 9.789001834884267,
    "reward_max": 17.778905233481158,
    "reward_min": -9.813556308956878,
    "reward_std": 4.184477735335155,
    "timesteps": 437652729,
    "learntime": 0.22442282387055457,
    "sampletime": 8.775941130006686,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1239,
    "reward_mean": 9.891559321408176,
    "reward_max": 15.639454729144223,
    "reward_min": -5.520471451893779,
    "reward_std": 3.898735015852948,
    "timesteps": 438010995,
    "learntime": 0.2640711290296167,
    "sampletime": 8.844183553010225,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1240,
    "reward_mean": 10.033831622538818,
    "reward_max": 15.047920668704643,
    "reward_min": -0.9576333103874336,
    "reward_std": 3.458774987704388,
    "timesteps": 438369123,
    "learntime": 0.22547951014712453,
    "sampletime": 8.868825803045183,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1241,
    "reward_mean": 10.465611383887204,
    "reward_max": 15.380105733659791,
    "reward_min": -0.1010995525866778,
    "reward_std": 3.301596713355104,
    "timesteps": 438729459,
    "learntime": 0.2763324270490557,
    "sampletime": 8.843257643049583,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1242,
    "reward_mean": 10.667279728227111,
    "reward_max": 17.652909436781723,
    "reward_min": 0.13770496658451428,
    "reward_std": 4.08215900705388,
    "timesteps": 439086207,
    "learntime": 0.2163765369914472,
    "sampletime": 8.814116291934624,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1243,
    "reward_mean": 10.153893137757446,
    "reward_max": 15.887099109671187,
    "reward_min": -1.8873870431476565,
    "reward_std": 4.605138828559915,
    "timesteps": 439443330,
    "learntime": 0.2604202381335199,
    "sampletime": 8.78711102111265,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1244,
    "reward_mean": 8.766593153398805,
    "reward_max": 15.828739393837605,
    "reward_min": -4.629309427765713,
    "reward_std": 5.156301770866428,
    "timesteps": 439800087,
    "learntime": 0.22912275581620634,
    "sampletime": 8.801437485963106,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1245,
    "reward_mean": 10.959607498164743,
    "reward_max": 16.446347708842065,
    "reward_min": -0.4807840187947439,
    "reward_std": 4.137828119377893,
    "timesteps": 440157711,
    "learntime": 0.26628726604394615,
    "sampletime": 8.604314974043518,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1246,
    "reward_mean": 10.686285180607445,
    "reward_max": 15.902641305040254,
    "reward_min": -5.437267941885186,
    "reward_std": 4.456843675510481,
    "timesteps": 440514240,
    "learntime": 0.23254410992376506,
    "sampletime": 8.789522310951725,
    "best_max_mean": 9.789001834884267,
    "best_max": 17.778905233481158
  },
  {
    "gen": 1247,
    "reward_mean": 12.901590982524983,
    "reward_max": 18.42970352649637,
    "reward_min": 3.055604559492261,
    "reward_std": 3.3193605167385787,
    "timesteps": 440873754,
    "learntime": 0.219637094065547,
    "sampletime": 8.94266373408027,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1248,
    "reward_mean": 8.968665547593403,
    "reward_max": 16.39915571136402,
    "reward_min": -5.695310607933528,
    "reward_std": 5.408449848760461,
    "timesteps": 441228693,
    "learntime": 0.22293458902277052,
    "sampletime": 8.721044015837833,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1249,
    "reward_mean": 12.072317136000763,
    "reward_max": 17.823330585325596,
    "reward_min": -3.4502798918860473,
    "reward_std": 4.510948872585865,
    "timesteps": 441586251,
    "learntime": 0.21839496307075024,
    "sampletime": 8.811626568902284,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1250,
    "reward_mean": 11.82190730286159,
    "reward_max": 17.955431750432272,
    "reward_min": 2.5751298510744642,
    "reward_std": 4.007387862186593,
    "timesteps": 441943551,
    "learntime": 0.22669730405323207,
    "sampletime": 8.88910731789656,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1251,
    "reward_mean": 12.220182548860645,
    "reward_max": 17.310702941386914,
    "reward_min": 2.0803659667744223,
    "reward_std": 4.12005455250927,
    "timesteps": 442301115,
    "learntime": 0.27105033583939075,
    "sampletime": 8.820193513995036,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1252,
    "reward_mean": 9.484758082494363,
    "reward_max": 17.453846599485114,
    "reward_min": -7.69826655356317,
    "reward_std": 5.349221453841675,
    "timesteps": 442657425,
    "learntime": 0.22831250983290374,
    "sampletime": 8.767931395908818,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1253,
    "reward_mean": 9.02485362044758,
    "reward_max": 18.407557348327384,
    "reward_min": -51.424068709595524,
    "reward_std": 9.697257381385022,
    "timesteps": 443010645,
    "learntime": 0.24949505901895463,
    "sampletime": 8.685748983873054,
    "best_max_mean": 12.901590982524983,
    "best_max": 18.42970352649637
  },
  {
    "gen": 1254,
    "reward_mean": 11.907851254372813,
    "reward_max": 18.759208711989526,
    "reward_min": -11.937553352246248,
    "reward_std": 5.285873225283356,
    "timesteps": 443368863,
    "learntime": 0.22460380499251187,
    "sampletime": 8.887801337055862,
    "best_max_mean": 11.907851254372813,
    "best_max": 18.759208711989526
  },
  {
    "gen": 1255,
    "reward_mean": 12.05036557565971,
    "reward_max": 18.240665480628554,
    "reward_min": -4.190238112391349,
    "reward_std": 4.454319970150327,
    "timesteps": 443726910,
    "learntime": 0.27937821904197335,
    "sampletime": 8.853577289963141,
    "best_max_mean": 11.907851254372813,
    "best_max": 18.759208711989526
  },
  {
    "gen": 1256,
    "reward_mean": 11.021423785766727,
    "reward_max": 17.226271875918783,
    "reward_min": -8.836821818156753,
    "reward_std": 5.536047914953765,
    "timesteps": 444085776,
    "learntime": 0.2267552688717842,
    "sampletime": 8.756466761929914,
    "best_max_mean": 11.907851254372813,
    "best_max": 18.759208711989526
  },
  {
    "gen": 1257,
    "reward_mean": 10.862659105692018,
    "reward_max": 17.534533463241658,
    "reward_min": -6.938702682809289,
    "reward_std": 5.2141706530339915,
    "timesteps": 444442239,
    "learntime": 0.26812071818858385,
    "sampletime": 8.76011332613416,
    "best_max_mean": 11.907851254372813,
    "best_max": 18.759208711989526
  },
  {
    "gen": 1258,
    "reward_mean": 10.970887123932634,
    "reward_max": 20.58806354798273,
    "reward_min": -24.519691324077996,
    "reward_std": 7.176252781053017,
    "timesteps": 444799461,
    "learntime": 0.21964329318143427,
    "sampletime": 8.88739698799327,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1259,
    "reward_mean": 11.879162920576414,
    "reward_max": 17.26862046801816,
    "reward_min": 1.7198463585368808,
    "reward_std": 4.169243616788138,
    "timesteps": 445158771,
    "learntime": 0.26485446584410965,
    "sampletime": 9.00991084612906,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1260,
    "reward_mean": 12.072575114078354,
    "reward_max": 18.392210492892247,
    "reward_min": -3.8692272631601408,
    "reward_std": 4.7989678201663875,
    "timesteps": 445517586,
    "learntime": 0.225578990066424,
    "sampletime": 8.838416825979948,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1261,
    "reward_mean": 12.457497342685071,
    "reward_max": 19.210735792683963,
    "reward_min": -6.743366894740827,
    "reward_std": 5.149843228967494,
    "timesteps": 445877163,
    "learntime": 0.26066034217365086,
    "sampletime": 9.015602262923494,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1262,
    "reward_mean": 12.675745864539966,
    "reward_max": 18.283642153335016,
    "reward_min": 2.487231103745712,
    "reward_std": 2.4520244291198163,
    "timesteps": 446237637,
    "learntime": 0.2181618930771947,
    "sampletime": 8.843284945003688,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1263,
    "reward_mean": 11.613413084223495,
    "reward_max": 17.05953443552117,
    "reward_min": -0.42974369192564765,
    "reward_std": 3.9127620546681228,
    "timesteps": 446597169,
    "learntime": 0.26815884513780475,
    "sampletime": 8.779480896890163,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1264,
    "reward_mean": 10.018065170591475,
    "reward_max": 17.181933456329826,
    "reward_min": -6.783981453994235,
    "reward_std": 5.466494064070394,
    "timesteps": 446953821,
    "learntime": 0.21301383688114583,
    "sampletime": 8.820099188014865,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1265,
    "reward_mean": 10.34957186584283,
    "reward_max": 16.76408483546622,
    "reward_min": -13.9900238017814,
    "reward_std": 5.727937941113125,
    "timesteps": 447312984,
    "learntime": 0.2654284799937159,
    "sampletime": 8.770771624986082,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1266,
    "reward_mean": 12.58211068575694,
    "reward_max": 17.17663873771247,
    "reward_min": 3.9993972644881457,
    "reward_std": 2.6454491661404678,
    "timesteps": 447673641,
    "learntime": 0.22008463693782687,
    "sampletime": 8.815823110053316,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1267,
    "reward_mean": 11.784603586935578,
    "reward_max": 17.606741767400468,
    "reward_min": -2.419697508337175,
    "reward_std": 4.530409964821848,
    "timesteps": 448032186,
    "learntime": 0.2786651491187513,
    "sampletime": 8.8121442431584,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1268,
    "reward_mean": 8.070454394602674,
    "reward_max": 17.81926664299328,
    "reward_min": -26.685128537204232,
    "reward_std": 8.486130786526818,
    "timesteps": 448389345,
    "learntime": 0.22465130290947855,
    "sampletime": 8.755912594031543,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1269,
    "reward_mean": 11.273832192888754,
    "reward_max": 17.985610423899775,
    "reward_min": -0.026210095557021616,
    "reward_std": 4.545398878848652,
    "timesteps": 448748382,
    "learntime": 0.2709709699265659,
    "sampletime": 8.87701915600337,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1270,
    "reward_mean": 11.985213976958491,
    "reward_max": 18.065230088872894,
    "reward_min": 1.8376574320506938,
    "reward_std": 3.1314207726767953,
    "timesteps": 449108907,
    "learntime": 0.21398786804638803,
    "sampletime": 8.88853609492071,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1271,
    "reward_mean": 11.679716938362445,
    "reward_max": 17.70858042552682,
    "reward_min": -5.4013008953788875,
    "reward_std": 4.3292994625319485,
    "timesteps": 449468217,
    "learntime": 0.262713355012238,
    "sampletime": 8.816627251915634,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1272,
    "reward_mean": 11.6389585435838,
    "reward_max": 17.35046223184679,
    "reward_min": -5.452456967354842,
    "reward_std": 4.012245219777053,
    "timesteps": 449828019,
    "learntime": 0.22796981711871922,
    "sampletime": 8.847452390007675,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1273,
    "reward_mean": 12.92162839727835,
    "reward_max": 19.150336204290706,
    "reward_min": 2.9451119625970894,
    "reward_std": 2.831386882086964,
    "timesteps": 450187449,
    "learntime": 0.28212282597087324,
    "sampletime": 8.913290398893878,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1274,
    "reward_mean": 10.727582613382168,
    "reward_max": 17.213611195449307,
    "reward_min": -3.418418318932202,
    "reward_std": 4.81497992840523,
    "timesteps": 450546402,
    "learntime": 0.22039885097183287,
    "sampletime": 8.8294385781046,
    "best_max_mean": 10.970887123932634,
    "best_max": 20.58806354798273
  },
  {
    "gen": 1275,
    "reward_mean": 12.569818851254245,
    "reward_max": 20.93375787454318,
    "reward_min": -2.328094769801921,
    "reward_std": 4.035386954034525,
    "timesteps": 450907020,
    "learntime": 0.27619019499979913,
    "sampletime": 8.957765470957384,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1276,
    "reward_mean": 11.51745509580754,
    "reward_max": 16.66673630246341,
    "reward_min": 1.047111339824776,
    "reward_std": 3.8354920234647096,
    "timesteps": 451267056,
    "learntime": 0.28286391985602677,
    "sampletime": 8.82847601803951,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1277,
    "reward_mean": 9.467545741978565,
    "reward_max": 18.866831525497023,
    "reward_min": -10.19311730710395,
    "reward_std": 5.820484891254935,
    "timesteps": 451624743,
    "learntime": 0.2651628158055246,
    "sampletime": 8.955274168867618,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1278,
    "reward_mean": 9.02204617694525,
    "reward_max": 16.81184543300928,
    "reward_min": -15.017352940980345,
    "reward_std": 5.934757314808441,
    "timesteps": 451983828,
    "learntime": 0.2259316830895841,
    "sampletime": 8.626544710015878,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1279,
    "reward_mean": 10.956491966337587,
    "reward_max": 17.801010589449575,
    "reward_min": -7.809302098569318,
    "reward_std": 4.843470397153693,
    "timesteps": 452343813,
    "learntime": 0.21981605887413025,
    "sampletime": 8.73726858291775,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1280,
    "reward_mean": 11.122272985554643,
    "reward_max": 17.499063751314573,
    "reward_min": -9.108073192108845,
    "reward_std": 6.083152597740328,
    "timesteps": 452703159,
    "learntime": 0.2913416021037847,
    "sampletime": 8.85319667099975,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1281,
    "reward_mean": 10.62876134103883,
    "reward_max": 17.376493656757347,
    "reward_min": -8.752383283464674,
    "reward_std": 5.549702361445257,
    "timesteps": 453062373,
    "learntime": 0.22642063302919269,
    "sampletime": 8.919456521049142,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1282,
    "reward_mean": 12.117753369473158,
    "reward_max": 17.913041257079,
    "reward_min": 1.5777889506756357,
    "reward_std": 3.7172991081843203,
    "timesteps": 453421863,
    "learntime": 0.26334502710960805,
    "sampletime": 8.844301678938791,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1283,
    "reward_mean": 11.624814766572067,
    "reward_max": 17.921349273317233,
    "reward_min": 1.2614672551748227,
    "reward_std": 4.462865824146247,
    "timesteps": 453780717,
    "learntime": 0.2635988730471581,
    "sampletime": 8.79291770607233,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1284,
    "reward_mean": 8.715041762562826,
    "reward_max": 17.515868678810264,
    "reward_min": -17.99926211036897,
    "reward_std": 7.508485793840065,
    "timesteps": 454137411,
    "learntime": 0.26608330896124244,
    "sampletime": 8.794433939037845,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1285,
    "reward_mean": 9.762010651928254,
    "reward_max": 19.108305510088233,
    "reward_min": -13.3795728984176,
    "reward_std": 6.60488920227484,
    "timesteps": 454495935,
    "learntime": 0.21912229899317026,
    "sampletime": 8.959708807989955,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1286,
    "reward_mean": 12.20538336675595,
    "reward_max": 18.87675437023933,
    "reward_min": -5.4920020673748615,
    "reward_std": 4.669856330745342,
    "timesteps": 454854204,
    "learntime": 0.26624211808666587,
    "sampletime": 8.799180864123628,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1287,
    "reward_mean": 9.867642710121055,
    "reward_max": 18.51839200588591,
    "reward_min": -13.253529662557412,
    "reward_std": 5.85435621284235,
    "timesteps": 455212026,
    "learntime": 0.2211214241106063,
    "sampletime": 8.801398413954303,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1288,
    "reward_mean": 9.639394078271687,
    "reward_max": 17.246431049347542,
    "reward_min": -7.605356833146124,
    "reward_std": 5.552871974453084,
    "timesteps": 455571408,
    "learntime": 0.23680847301147878,
    "sampletime": 8.85541748511605,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1289,
    "reward_mean": 10.481098252687502,
    "reward_max": 17.197255244247074,
    "reward_min": -6.1972641989228885,
    "reward_std": 4.849051749769287,
    "timesteps": 455930553,
    "learntime": 0.22490706504322588,
    "sampletime": 8.745075997896492,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1290,
    "reward_mean": 12.190665880462419,
    "reward_max": 17.916115474199284,
    "reward_min": -12.038226761748472,
    "reward_std": 5.257872508052143,
    "timesteps": 456289890,
    "learntime": 0.2753720870241523,
    "sampletime": 8.794982667081058,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1291,
    "reward_mean": 12.720693358211228,
    "reward_max": 18.183829389854097,
    "reward_min": 3.109527864606315,
    "reward_std": 4.074563772041695,
    "timesteps": 456649071,
    "learntime": 0.21648108982481062,
    "sampletime": 8.746159510919824,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1292,
    "reward_mean": 12.420668704894062,
    "reward_max": 18.395341964604363,
    "reward_min": -6.615009049415781,
    "reward_std": 4.494091153361674,
    "timesteps": 457008153,
    "learntime": 0.27344734291546047,
    "sampletime": 8.80808932799846,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1293,
    "reward_mean": 10.513941040257595,
    "reward_max": 18.416193653007426,
    "reward_min": -8.63556905330916,
    "reward_std": 5.743769893365999,
    "timesteps": 457365816,
    "learntime": 0.22433928912505507,
    "sampletime": 8.816388116916642,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1294,
    "reward_mean": 10.320562870706343,
    "reward_max": 17.773888210042827,
    "reward_min": -13.110484075753702,
    "reward_std": 6.408942072872026,
    "timesteps": 457724976,
    "learntime": 0.2872015649918467,
    "sampletime": 8.817109625088051,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1295,
    "reward_mean": 14.792498009611029,
    "reward_max": 18.793079106899143,
    "reward_min": 11.1219433530617,
    "reward_std": 1.826837853381795,
    "timesteps": 458085696,
    "learntime": 0.22115538897924125,
    "sampletime": 8.770274271024391,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1296,
    "reward_mean": 11.366597590580739,
    "reward_max": 18.505515749149982,
    "reward_min": -5.955769462101727,
    "reward_std": 5.555193348003277,
    "timesteps": 458443836,
    "learntime": 0.27967055002227426,
    "sampletime": 8.797803622903302,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1297,
    "reward_mean": 12.163053545708916,
    "reward_max": 18.485673229190677,
    "reward_min": 1.724362634891414,
    "reward_std": 4.158498901361837,
    "timesteps": 458803119,
    "learntime": 0.2173070020508021,
    "sampletime": 8.820956747978926,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1298,
    "reward_mean": 12.533927677583844,
    "reward_max": 20.33134355738928,
    "reward_min": -1.323097402244025,
    "reward_std": 4.562502963462898,
    "timesteps": 459163374,
    "learntime": 0.25712857907637954,
    "sampletime": 8.849050308810547,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1299,
    "reward_mean": 8.640300622424675,
    "reward_max": 17.624021659696922,
    "reward_min": -4.790016261335103,
    "reward_std": 6.150155022990098,
    "timesteps": 459518781,
    "learntime": 0.22237866884097457,
    "sampletime": 8.98908075899817,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1300,
    "reward_mean": 11.665220044508331,
    "reward_max": 19.115067326844752,
    "reward_min": -4.243423197291458,
    "reward_std": 5.954152230799777,
    "timesteps": 459876483,
    "learntime": 0.27936926879920065,
    "sampletime": 8.88917011814192,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1301,
    "reward_mean": 10.031614990651935,
    "reward_max": 19.7795518548122,
    "reward_min": -22.482497269675758,
    "reward_std": 7.026580490486948,
    "timesteps": 460234341,
    "learntime": 0.2171760811470449,
    "sampletime": 8.77315684617497,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1302,
    "reward_mean": 9.793848063472613,
    "reward_max": 19.27360826784967,
    "reward_min": -10.521985969231437,
    "reward_std": 6.496173042363534,
    "timesteps": 460591857,
    "learntime": 0.268736561993137,
    "sampletime": 8.797662919852883,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1303,
    "reward_mean": 10.139732654760273,
    "reward_max": 17.460941153897718,
    "reward_min": -6.1000376374700656,
    "reward_std": 5.892409873121111,
    "timesteps": 460948923,
    "learntime": 0.2325157371815294,
    "sampletime": 8.81506834900938,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1304,
    "reward_mean": 11.689645941987099,
    "reward_max": 18.56950663730094,
    "reward_min": -4.0175205181909055,
    "reward_std": 5.986467436780501,
    "timesteps": 461307549,
    "learntime": 0.2787539029959589,
    "sampletime": 8.86318181687966,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1305,
    "reward_mean": 11.963669097583095,
    "reward_max": 19.91998821840565,
    "reward_min": -6.134070135060363,
    "reward_std": 6.0306150371377525,
    "timesteps": 461664735,
    "learntime": 0.22451212699525058,
    "sampletime": 8.608944105915725,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1306,
    "reward_mean": 9.688697376761649,
    "reward_max": 18.613316204455312,
    "reward_min": -6.930461045185271,
    "reward_std": 6.201360273697915,
    "timesteps": 462020319,
    "learntime": 0.2647395038511604,
    "sampletime": 8.836645262083039,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1307,
    "reward_mean": 11.956713586395932,
    "reward_max": 18.08863053196656,
    "reward_min": -3.493972749562201,
    "reward_std": 4.870810497871985,
    "timesteps": 462379143,
    "learntime": 0.2213315840344876,
    "sampletime": 8.891652969177812,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1308,
    "reward_mean": 10.43624796182607,
    "reward_max": 17.73642914017634,
    "reward_min": -15.162779894466935,
    "reward_std": 6.320296748964923,
    "timesteps": 462736500,
    "learntime": 0.25649352883920074,
    "sampletime": 8.850240034982562,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1309,
    "reward_mean": 10.118031730103736,
    "reward_max": 20.15370390566466,
    "reward_min": -7.196639867146697,
    "reward_std": 6.586860441775418,
    "timesteps": 463094436,
    "learntime": 0.23361600399948657,
    "sampletime": 8.744654261972755,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1310,
    "reward_mean": 12.825249778318575,
    "reward_max": 19.621862231746714,
    "reward_min": -4.636831401431916,
    "reward_std": 4.827992668588834,
    "timesteps": 463453464,
    "learntime": 0.29014552803710103,
    "sampletime": 8.68751013604924,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1311,
    "reward_mean": 10.491824829496714,
    "reward_max": 19.483995893349253,
    "reward_min": -12.037522772101294,
    "reward_std": 7.3425654466596715,
    "timesteps": 463810776,
    "learntime": 0.22787499194964767,
    "sampletime": 8.799778165994212,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1312,
    "reward_mean": 11.506124118470995,
    "reward_max": 18.611170579036393,
    "reward_min": -6.027797687195496,
    "reward_std": 5.403751759302733,
    "timesteps": 464168607,
    "learntime": 0.27638957486487925,
    "sampletime": 8.674073067959398,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1313,
    "reward_mean": 10.385729877230347,
    "reward_max": 19.94799449798567,
    "reward_min": -23.53592440782167,
    "reward_std": 7.55607580084194,
    "timesteps": 464524251,
    "learntime": 0.22290606214664876,
    "sampletime": 8.827134208986536,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1314,
    "reward_mean": 9.5997741001032,
    "reward_max": 19.644499151083764,
    "reward_min": -9.699733515774524,
    "reward_std": 7.4129283775710295,
    "timesteps": 464882625,
    "learntime": 0.24047248298302293,
    "sampletime": 8.726505324011669,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1315,
    "reward_mean": 10.527121470635173,
    "reward_max": 19.830677284181792,
    "reward_min": -7.277260632063687,
    "reward_std": 7.0909698521164435,
    "timesteps": 465238713,
    "learntime": 0.22992490511387587,
    "sampletime": 8.762296769069508,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1316,
    "reward_mean": 9.517014867695062,
    "reward_max": 19.010009105581513,
    "reward_min": -19.921966062426552,
    "reward_std": 7.674797113283418,
    "timesteps": 465596199,
    "learntime": 0.23259624210186303,
    "sampletime": 8.941347962012514,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1317,
    "reward_mean": 8.578484408272166,
    "reward_max": 19.14507622377079,
    "reward_min": -23.019293139688674,
    "reward_std": 8.335377901094601,
    "timesteps": 465951267,
    "learntime": 0.26084398198872805,
    "sampletime": 8.723921338096261,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1318,
    "reward_mean": 12.494082516034272,
    "reward_max": 19.250448698772797,
    "reward_min": -3.0320652950498617,
    "reward_std": 5.1393868984756805,
    "timesteps": 466310394,
    "learntime": 0.2565529029816389,
    "sampletime": 8.727259285049513,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1319,
    "reward_mean": 11.71735105268266,
    "reward_max": 18.98027400918672,
    "reward_min": -15.983972795682748,
    "reward_std": 6.248409816704927,
    "timesteps": 466667295,
    "learntime": 0.22115743113681674,
    "sampletime": 8.729654571972787,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1320,
    "reward_mean": 11.986036422931676,
    "reward_max": 18.840812413633977,
    "reward_min": -14.2183726193087,
    "reward_std": 5.515507944874914,
    "timesteps": 467023710,
    "learntime": 0.22504996112547815,
    "sampletime": 8.81247379584238,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1321,
    "reward_mean": 11.493364241903866,
    "reward_max": 18.68926326368202,
    "reward_min": -3.3675427360752974,
    "reward_std": 5.209945340803554,
    "timesteps": 467378937,
    "learntime": 0.2671292161103338,
    "sampletime": 8.838887821882963,
    "best_max_mean": 12.569818851254245,
    "best_max": 20.93375787454318
  },
  {
    "gen": 1322,
    "reward_mean": 12.496272878874564,
    "reward_max": 21.490706829476746,
    "reward_min": -4.451157597041777,
    "reward_std": 5.723821143964822,
    "timesteps": 467737806,
    "learntime": 0.22479161503724754,
    "sampletime": 8.788899186998606,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1323,
    "reward_mean": 11.960232811825556,
    "reward_max": 17.54127658273546,
    "reward_min": -5.679562703438221,
    "reward_std": 5.45533848086262,
    "timesteps": 468095565,
    "learntime": 0.27032186393626034,
    "sampletime": 8.820538307074457,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1324,
    "reward_mean": 12.152839782505174,
    "reward_max": 19.366048474505074,
    "reward_min": 0.3185641751201315,
    "reward_std": 4.5457152625639115,
    "timesteps": 468455421,
    "learntime": 0.2150409419555217,
    "sampletime": 8.700031277956441,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1325,
    "reward_mean": 11.746260412107304,
    "reward_max": 20.199369297097682,
    "reward_min": -6.128159935635543,
    "reward_std": 5.790790302327564,
    "timesteps": 468814524,
    "learntime": 0.2782291939947754,
    "sampletime": 8.892643077066168,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1326,
    "reward_mean": 12.300182737877634,
    "reward_max": 18.798690534334376,
    "reward_min": -6.402089324917393,
    "reward_std": 5.130596776629867,
    "timesteps": 469172271,
    "learntime": 0.22985761892050505,
    "sampletime": 8.8202367820777,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1327,
    "reward_mean": 11.6939502833708,
    "reward_max": 18.469362942378435,
    "reward_min": -4.106092772107913,
    "reward_std": 5.232548198431778,
    "timesteps": 469531236,
    "learntime": 0.2791146670933813,
    "sampletime": 8.878570090048015,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1328,
    "reward_mean": 9.400192112726671,
    "reward_max": 18.24677929789477,
    "reward_min": -15.106015103629248,
    "reward_std": 7.95365773613863,
    "timesteps": 469887186,
    "learntime": 0.2252995208837092,
    "sampletime": 8.83783346391283,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1329,
    "reward_mean": 11.657142919543588,
    "reward_max": 17.745113023140483,
    "reward_min": -5.153008207010295,
    "reward_std": 5.308760066645132,
    "timesteps": 470246136,
    "learntime": 0.2799514790531248,
    "sampletime": 8.799420719966292,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1330,
    "reward_mean": 11.55431278936032,
    "reward_max": 20.38560882441945,
    "reward_min": -4.548957264392154,
    "reward_std": 4.3718878684099,
    "timesteps": 470605701,
    "learntime": 0.22641212004236877,
    "sampletime": 8.90207201987505,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1331,
    "reward_mean": 13.270753536085683,
    "reward_max": 18.396164627224305,
    "reward_min": 0.7963674494725042,
    "reward_std": 3.8915531882437353,
    "timesteps": 470965077,
    "learntime": 0.2829388710670173,
    "sampletime": 8.81335604400374,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1332,
    "reward_mean": 12.75957709066217,
    "reward_max": 18.272275769218776,
    "reward_min": -0.7201171027898696,
    "reward_std": 4.051670329018093,
    "timesteps": 471325122,
    "learntime": 0.22999925795011222,
    "sampletime": 8.929927546996623,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1333,
    "reward_mean": 10.545201031589478,
    "reward_max": 18.26005239608859,
    "reward_min": -6.325439292930463,
    "reward_std": 6.496191603362775,
    "timesteps": 471682317,
    "learntime": 0.261077594012022,
    "sampletime": 8.819003693992272,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1334,
    "reward_mean": 11.04715083775518,
    "reward_max": 19.56009751000965,
    "reward_min": -11.388902036522547,
    "reward_std": 6.678895891132325,
    "timesteps": 472037865,
    "learntime": 0.23205023095943034,
    "sampletime": 8.991564936935902,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1335,
    "reward_mean": 12.495146693685173,
    "reward_max": 20.157382923393563,
    "reward_min": -4.440365663200452,
    "reward_std": 5.416385869254642,
    "timesteps": 472394514,
    "learntime": 0.2769505048636347,
    "sampletime": 8.784656040137634,
    "best_max_mean": 12.496272878874564,
    "best_max": 21.490706829476746
  },
  {
    "gen": 1336,
    "reward_mean": 11.91465524238702,
    "reward_max": 21.981763082773373,
    "reward_min": -19.708418599485114,
    "reward_std": 6.171669816133927,
    "timesteps": 472753116,
    "learntime": 0.23705163202248514,
    "sampletime": 8.90918809408322,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1337,
    "reward_mean": 13.47740401138271,
    "reward_max": 20.284245326741118,
    "reward_min": 2.9014310308654476,
    "reward_std": 3.5134666719488035,
    "timesteps": 473112516,
    "learntime": 0.26652134000323713,
    "sampletime": 8.852876883931458,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1338,
    "reward_mean": 13.464605912127892,
    "reward_max": 19.603269790953465,
    "reward_min": 2.5500394080151065,
    "reward_std": 3.8731250534550674,
    "timesteps": 473472003,
    "learntime": 0.22651453502476215,
    "sampletime": 8.83917091996409,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1339,
    "reward_mean": 12.8316587515667,
    "reward_max": 19.121503334291358,
    "reward_min": -2.08908196209196,
    "reward_std": 4.214872928510084,
    "timesteps": 473831577,
    "learntime": 0.2752306559123099,
    "sampletime": 8.841358373872936,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1340,
    "reward_mean": 11.034424499678614,
    "reward_max": 19.80876371196064,
    "reward_min": -5.221997222217568,
    "reward_std": 5.882761496530179,
    "timesteps": 474187632,
    "learntime": 0.23208845197223127,
    "sampletime": 8.805781304836273,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1341,
    "reward_mean": 12.880539472571211,
    "reward_max": 18.403268172052442,
    "reward_min": 1.9041285956574727,
    "reward_std": 4.003557317446929,
    "timesteps": 474546738,
    "learntime": 0.281816435046494,
    "sampletime": 8.913967658998445,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1342,
    "reward_mean": 13.65206253482411,
    "reward_max": 21.217660338821144,
    "reward_min": 3.152417784939499,
    "reward_std": 4.231144861089938,
    "timesteps": 474906372,
    "learntime": 0.24415339180268347,
    "sampletime": 8.788690760033205,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1343,
    "reward_mean": 10.97562084323173,
    "reward_max": 18.172654394917316,
    "reward_min": -6.191355626515082,
    "reward_std": 6.215816207491902,
    "timesteps": 475262490,
    "learntime": 0.28453847696073353,
    "sampletime": 8.910856156144291,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1344,
    "reward_mean": 12.9953000540489,
    "reward_max": 19.711508392261088,
    "reward_min": -1.3495816504582778,
    "reward_std": 4.285453239058595,
    "timesteps": 475621614,
    "learntime": 0.22481138701550663,
    "sampletime": 8.78946195798926,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1345,
    "reward_mean": 11.486334069936396,
    "reward_max": 18.933202731261385,
    "reward_min": -5.2531597384917825,
    "reward_std": 5.461751946780661,
    "timesteps": 475980705,
    "learntime": 0.28089068713597953,
    "sampletime": 8.756707650842145,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1346,
    "reward_mean": 14.324049972777448,
    "reward_max": 20.150437303522434,
    "reward_min": 3.1522677249317463,
    "reward_std": 3.941419537637531,
    "timesteps": 476339232,
    "learntime": 0.23064126609824598,
    "sampletime": 8.812734325183555,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1347,
    "reward_mean": 12.370947146789504,
    "reward_max": 20.002552011064395,
    "reward_min": -2.7070939995788272,
    "reward_std": 5.76870242202573,
    "timesteps": 476697873,
    "learntime": 0.2639460538048297,
    "sampletime": 8.920416374923661,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1348,
    "reward_mean": 12.40078796832299,
    "reward_max": 19.428461956248313,
    "reward_min": -2.1667917265405077,
    "reward_std": 5.062617595978928,
    "timesteps": 477055641,
    "learntime": 0.22887897491455078,
    "sampletime": 8.830216438975185,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1349,
    "reward_mean": 10.789123937413656,
    "reward_max": 18.99844204894362,
    "reward_min": -5.9463639572672005,
    "reward_std": 5.626354141902554,
    "timesteps": 477414189,
    "learntime": 0.2757605218794197,
    "sampletime": 8.914956940105185,
    "best_max_mean": 11.91465524238702,
    "best_max": 21.981763082773373
  },
  {
    "gen": 1350,
    "reward_mean": 14.81289085950671,
    "reward_max": 22.10944241257807,
    "reward_min": -0.9408641029978365,
    "reward_std": 5.14117012545048,
    "timesteps": 477773124,
    "learntime": 0.2304810960777104,
    "sampletime": 8.861769055016339,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1351,
    "reward_mean": 12.813096347922254,
    "reward_max": 20.29799214815967,
    "reward_min": -4.223148918427557,
    "reward_std": 5.2645639268953115,
    "timesteps": 478130364,
    "learntime": 0.22283915313892066,
    "sampletime": 8.87494921288453,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1352,
    "reward_mean": 13.664508258834068,
    "reward_max": 20.748446945566684,
    "reward_min": -6.12429852574838,
    "reward_std": 4.862700234084247,
    "timesteps": 478489473,
    "learntime": 0.220809793099761,
    "sampletime": 8.818272865843028,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1353,
    "reward_mean": 11.079575166476497,
    "reward_max": 19.139787392083132,
    "reward_min": -4.579140839805574,
    "reward_std": 5.633084320621879,
    "timesteps": 478845735,
    "learntime": 0.22191635984927416,
    "sampletime": 8.851031523896381,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1354,
    "reward_mean": 9.378640173344536,
    "reward_max": 20.200674903359165,
    "reward_min": -15.880993674095606,
    "reward_std": 8.067984525144452,
    "timesteps": 479200797,
    "learntime": 0.22292197006754577,
    "sampletime": 8.762225094018504,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1355,
    "reward_mean": 12.82116397716819,
    "reward_max": 21.24790829305614,
    "reward_min": -3.1547780151507125,
    "reward_std": 5.529023548400357,
    "timesteps": 479556927,
    "learntime": 0.23632925003767014,
    "sampletime": 8.74694380001165,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1356,
    "reward_mean": 13.94690747393239,
    "reward_max": 21.133319664683018,
    "reward_min": -1.8305187010908364,
    "reward_std": 5.291274036295221,
    "timesteps": 479914584,
    "learntime": 0.26632276899181306,
    "sampletime": 8.936495453119278,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1357,
    "reward_mean": 14.390399433785298,
    "reward_max": 21.70427826523541,
    "reward_min": 0.9821195022280579,
    "reward_std": 4.125911602317271,
    "timesteps": 480273552,
    "learntime": 0.22746359813027084,
    "sampletime": 8.815537020098418,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1358,
    "reward_mean": 12.684227046090308,
    "reward_max": 20.14844971793354,
    "reward_min": -10.363700564449768,
    "reward_std": 5.236048198285994,
    "timesteps": 480631956,
    "learntime": 0.2283780979923904,
    "sampletime": 8.959846265148371,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1359,
    "reward_mean": 13.487182833181112,
    "reward_max": 19.156847393806938,
    "reward_min": -11.830152050930668,
    "reward_std": 5.952646757536464,
    "timesteps": 480990477,
    "learntime": 0.2719435861799866,
    "sampletime": 8.89282852690667,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1360,
    "reward_mean": 15.8063627756957,
    "reward_max": 20.53251566601543,
    "reward_min": 5.947055426659062,
    "reward_std": 2.8002195073695875,
    "timesteps": 481350243,
    "learntime": 0.22829211503267288,
    "sampletime": 8.90772063890472,
    "best_max_mean": 14.81289085950671,
    "best_max": 22.10944241257807
  },
  {
    "gen": 1361,
    "reward_mean": 13.521853280867589,
    "reward_max": 22.528075309643153,
    "reward_min": -1.5903028054109996,
    "reward_std": 5.179786869063126,
    "timesteps": 481705653,
    "learntime": 0.23804220603778958,
    "sampletime": 8.784318848978728,
    "best_max_mean": 13.521853280867589,
    "best_max": 22.528075309643153
  },
  {
    "gen": 1362,
    "reward_mean": 14.643223970689206,
    "reward_max": 20.9881972028648,
    "reward_min": 2.240954224056782,
    "reward_std": 4.0967639404072935,
    "timesteps": 482063418,
    "learntime": 0.27620955696329474,
    "sampletime": 8.771627636160702,
    "best_max_mean": 13.521853280867589,
    "best_max": 22.528075309643153
  },
  {
    "gen": 1363,
    "reward_mean": 14.855354668452696,
    "reward_max": 23.012137284075088,
    "reward_min": -7.6170714725643265,
    "reward_std": 5.689645497443859,
    "timesteps": 482420967,
    "learntime": 0.23290584003552794,
    "sampletime": 8.899937463924289,
    "best_max_mean": 14.855354668452696,
    "best_max": 23.012137284075088
  },
  {
    "gen": 1364,
    "reward_mean": 15.866799605283624,
    "reward_max": 21.412396952174745,
    "reward_min": 1.2780024375083963,
    "reward_std": 4.74410841338047,
    "timesteps": 482780463,
    "learntime": 0.29487589513882995,
    "sampletime": 8.737757764058188,
    "best_max_mean": 14.855354668452696,
    "best_max": 23.012137284075088
  },
  {
    "gen": 1365,
    "reward_mean": 14.102434891600755,
    "reward_max": 23.655024110928125,
    "reward_min": 1.4470898034827162,
    "reward_std": 4.684860091007552,
    "timesteps": 483137523,
    "learntime": 0.2233923429157585,
    "sampletime": 8.856908710906282,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1366,
    "reward_mean": 14.337215471726358,
    "reward_max": 20.120458888831013,
    "reward_min": -3.2133906163960866,
    "reward_std": 4.010410401276914,
    "timesteps": 483496968,
    "learntime": 0.2988833310082555,
    "sampletime": 8.887581029906869,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1367,
    "reward_mean": 15.449634085662911,
    "reward_max": 21.152874406663212,
    "reward_min": 1.0434382982850992,
    "reward_std": 4.929596305312686,
    "timesteps": 483856683,
    "learntime": 0.2353474071715027,
    "sampletime": 8.891921454109251,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1368,
    "reward_mean": 16.38979246177747,
    "reward_max": 20.547896806491543,
    "reward_min": 12.414915246673802,
    "reward_std": 1.9418334774219277,
    "timesteps": 484217403,
    "learntime": 0.27944062696769834,
    "sampletime": 8.840595845133066,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1369,
    "reward_mean": 15.02779882091247,
    "reward_max": 20.71792972983906,
    "reward_min": -0.9178774431719702,
    "reward_std": 4.8976401722456675,
    "timesteps": 484575159,
    "learntime": 0.22394143603742123,
    "sampletime": 8.878009062027559,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1370,
    "reward_mean": 15.063788035339961,
    "reward_max": 22.402810606992308,
    "reward_min": -11.998832537654163,
    "reward_std": 6.060690528776565,
    "timesteps": 484931739,
    "learntime": 0.27479782700538635,
    "sampletime": 8.890278530074283,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1371,
    "reward_mean": 15.174023434613336,
    "reward_max": 21.08745158065093,
    "reward_min": -3.146227725453429,
    "reward_std": 4.82887178792956,
    "timesteps": 485289366,
    "learntime": 0.2273102211765945,
    "sampletime": 8.872921236092225,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1372,
    "reward_mean": 17.113155550224732,
    "reward_max": 22.02888059046947,
    "reward_min": 2.307624231492001,
    "reward_std": 3.674112663972678,
    "timesteps": 485648895,
    "learntime": 0.26403413293883204,
    "sampletime": 8.761628260836005,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1373,
    "reward_mean": 16.16832091267704,
    "reward_max": 21.726481095527888,
    "reward_min": 4.067492305503638,
    "reward_std": 3.9572197743054423,
    "timesteps": 486008343,
    "learntime": 0.2334384119603783,
    "sampletime": 8.714184292824939,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1374,
    "reward_mean": 17.12131011919613,
    "reward_max": 21.979245240305314,
    "reward_min": 9.106063275019444,
    "reward_std": 3.0676610327324703,
    "timesteps": 486368604,
    "learntime": 0.27499617100693285,
    "sampletime": 8.85133009403944,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1375,
    "reward_mean": 14.596371267627909,
    "reward_max": 20.206431445651553,
    "reward_min": -3.7583140857821125,
    "reward_std": 5.581167322158259,
    "timesteps": 486726021,
    "learntime": 0.22609000210650265,
    "sampletime": 8.78725103288889,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1376,
    "reward_mean": 16.41871197386544,
    "reward_max": 22.39298561261966,
    "reward_min": -2.6596625762582424,
    "reward_std": 5.840802415754433,
    "timesteps": 487082076,
    "learntime": 0.2838127580471337,
    "sampletime": 8.767422887030989,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1377,
    "reward_mean": 17.83583328674242,
    "reward_max": 22.323584685341995,
    "reward_min": 8.919045188062057,
    "reward_std": 3.758441091870466,
    "timesteps": 487441161,
    "learntime": 0.23116941191256046,
    "sampletime": 8.972982204053551,
    "best_max_mean": 14.102434891600755,
    "best_max": 23.655024110928125
  },
  {
    "gen": 1378,
    "reward_mean": 17.02464808415712,
    "reward_max": 23.91847253765201,
    "reward_min": 6.781648663232435,
    "reward_std": 4.326776000077871,
    "timesteps": 487797480,
    "learntime": 0.27569713699631393,
    "sampletime": 8.898719936842099,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1379,
    "reward_mean": 17.802524769003536,
    "reward_max": 21.029899158715526,
    "reward_min": 8.249817450283881,
    "reward_std": 2.859425745290137,
    "timesteps": 488157063,
    "learntime": 0.24846825911663473,
    "sampletime": 8.980698220198974,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1380,
    "reward_mean": 15.507014733184441,
    "reward_max": 23.696473127470885,
    "reward_min": -1.7304707928302019,
    "reward_std": 6.179774505674579,
    "timesteps": 488511564,
    "learntime": 0.2912110129836947,
    "sampletime": 8.8992554389406,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1381,
    "reward_mean": 15.993029696192885,
    "reward_max": 23.26206633559841,
    "reward_min": -0.08956225056935065,
    "reward_std": 5.280413972930269,
    "timesteps": 488867565,
    "learntime": 0.21959366113878787,
    "sampletime": 8.818321263184771,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1382,
    "reward_mean": 17.458507805071157,
    "reward_max": 23.08405790389797,
    "reward_min": 7.338075839551456,
    "reward_std": 4.124128115348893,
    "timesteps": 489224379,
    "learntime": 0.2981624489184469,
    "sampletime": 8.851688159862533,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1383,
    "reward_mean": 13.406143228892656,
    "reward_max": 23.142502771775142,
    "reward_min": -20.28232343034875,
    "reward_std": 8.787472114493877,
    "timesteps": 489575205,
    "learntime": 0.2279170227702707,
    "sampletime": 8.792863277019933,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1384,
    "reward_mean": 13.869203911202066,
    "reward_max": 23.712113491873335,
    "reward_min": -31.74527051533347,
    "reward_std": 9.876141848361954,
    "timesteps": 489929793,
    "learntime": 0.27903115819208324,
    "sampletime": 8.813563676085323,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1385,
    "reward_mean": 12.163149566396015,
    "reward_max": 21.940585678423105,
    "reward_min": -11.755760331511157,
    "reward_std": 8.000389609916253,
    "timesteps": 490279053,
    "learntime": 0.22891590907238424,
    "sampletime": 8.818060363875702,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1386,
    "reward_mean": 15.641543636834262,
    "reward_max": 22.46194906811456,
    "reward_min": -1.3927730527233797,
    "reward_std": 6.749832076985694,
    "timesteps": 490634157,
    "learntime": 0.22486537205986679,
    "sampletime": 8.888283009873703,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1387,
    "reward_mean": 15.933138684443115,
    "reward_max": 22.636020849783424,
    "reward_min": 0.564998643201146,
    "reward_std": 5.2979333401990205,
    "timesteps": 490992093,
    "learntime": 0.2369076511822641,
    "sampletime": 8.93632838409394,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1388,
    "reward_mean": 15.921104573531498,
    "reward_max": 22.300786498096894,
    "reward_min": -4.06740872667058,
    "reward_std": 5.354212149667564,
    "timesteps": 491348226,
    "learntime": 0.22585690510459244,
    "sampletime": 8.828805765137076,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1389,
    "reward_mean": 16.057576734128155,
    "reward_max": 22.97916100877001,
    "reward_min": -4.016794186810412,
    "reward_std": 6.418088472514767,
    "timesteps": 491703963,
    "learntime": 0.2913383231498301,
    "sampletime": 8.851913063088432,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1390,
    "reward_mean": 16.220027752910532,
    "reward_max": 21.826118901908174,
    "reward_min": 6.569963496615819,
    "reward_std": 3.932158524492935,
    "timesteps": 492060777,
    "learntime": 0.23269608919508755,
    "sampletime": 8.931097930064425,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1391,
    "reward_mean": 17.42723297342875,
    "reward_max": 22.665275101683974,
    "reward_min": 6.953333262672071,
    "reward_std": 4.150278907032598,
    "timesteps": 492417507,
    "learntime": 0.2373205740004778,
    "sampletime": 8.829004382016137,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1392,
    "reward_mean": 17.89637306728914,
    "reward_max": 22.087534925872177,
    "reward_min": -1.079451151405617,
    "reward_std": 3.887106707237152,
    "timesteps": 492776079,
    "learntime": 0.23596568894572556,
    "sampletime": 8.8388531091623,
    "best_max_mean": 17.02464808415712,
    "best_max": 23.91847253765201
  },
  {
    "gen": 1393,
    "reward_mean": 17.889918623988216,
    "reward_max": 23.95931725036071,
    "reward_min": 7.783267504426251,
    "reward_std": 3.0909100187005754,
    "timesteps": 493134987,
    "learntime": 0.23368013580329716,
    "sampletime": 8.964168587932363,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1394,
    "reward_mean": 15.774560457740394,
    "reward_max": 21.590477680137273,
    "reward_min": -2.140157117406052,
    "reward_std": 5.464727812122886,
    "timesteps": 493491327,
    "learntime": 0.23236509505659342,
    "sampletime": 8.777186712948605,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1395,
    "reward_mean": 15.074873164605343,
    "reward_max": 21.757215527630635,
    "reward_min": -3.095165819335361,
    "reward_std": 6.058284644558118,
    "timesteps": 493845804,
    "learntime": 0.22283047693781555,
    "sampletime": 8.764780660858378,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1396,
    "reward_mean": 14.171345476661575,
    "reward_max": 20.47778642625296,
    "reward_min": -20.99067715552607,
    "reward_std": 6.616203834976266,
    "timesteps": 494199837,
    "learntime": 0.24152011889964342,
    "sampletime": 8.860450842883438,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1397,
    "reward_mean": 15.689704956957863,
    "reward_max": 21.01122379346017,
    "reward_min": -0.3579206502234387,
    "reward_std": 4.6752526902369045,
    "timesteps": 494555757,
    "learntime": 0.22896048915572464,
    "sampletime": 8.794578929897398,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1398,
    "reward_mean": 17.605594250067252,
    "reward_max": 20.997601043217756,
    "reward_min": 8.478202268763466,
    "reward_std": 2.5544181629523943,
    "timesteps": 494916447,
    "learntime": 0.237093694973737,
    "sampletime": 8.91988313011825,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1399,
    "reward_mean": 15.833220898582372,
    "reward_max": 21.436453383006718,
    "reward_min": 5.06773930360478,
    "reward_std": 4.211914167506652,
    "timesteps": 495272739,
    "learntime": 0.2434106389991939,
    "sampletime": 8.860008532181382,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1400,
    "reward_mean": 14.73592918560601,
    "reward_max": 22.356987368470676,
    "reward_min": -10.45320868646054,
    "reward_std": 5.8944048628994565,
    "timesteps": 495627879,
    "learntime": 0.22218000306747854,
    "sampletime": 8.983121808152646,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1401,
    "reward_mean": 16.32532718314073,
    "reward_max": 22.078432329648145,
    "reward_min": -0.579717598034124,
    "reward_std": 3.9883110937894277,
    "timesteps": 495986109,
    "learntime": 0.11305014090612531,
    "sampletime": 8.937043105950579,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1402,
    "reward_mean": 15.433977019005965,
    "reward_max": 20.93341363965054,
    "reward_min": 5.947166438760397,
    "reward_std": 3.8252286990957347,
    "timesteps": 496343367,
    "learntime": 0.23719671508297324,
    "sampletime": 8.919379081111401,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1403,
    "reward_mean": 15.038465396474155,
    "reward_max": 21.240439501781527,
    "reward_min": 3.3515616522539244,
    "reward_std": 4.46447621523597,
    "timesteps": 496700502,
    "learntime": 0.22100493405014277,
    "sampletime": 8.980408709961921,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1404,
    "reward_mean": 15.923561027671322,
    "reward_max": 20.92660926888824,
    "reward_min": -0.3601393107480136,
    "reward_std": 4.206752082540838,
    "timesteps": 497056857,
    "learntime": 0.23181736189872026,
    "sampletime": 8.830279198940843,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1405,
    "reward_mean": 16.576171749731465,
    "reward_max": 21.811646596013528,
    "reward_min": 4.179849024883212,
    "reward_std": 3.9051774332488094,
    "timesteps": 497414289,
    "learntime": 0.23638253612443805,
    "sampletime": 8.860115119954571,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1406,
    "reward_mean": 15.987648529043053,
    "reward_max": 21.180542988235228,
    "reward_min": -0.46884315596385373,
    "reward_std": 4.4858333639336285,
    "timesteps": 497771943,
    "learntime": 0.23628981108777225,
    "sampletime": 8.88501044199802,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1407,
    "reward_mean": 15.837219101291556,
    "reward_max": 20.99899742681758,
    "reward_min": -0.2930308645308912,
    "reward_std": 4.247080627945206,
    "timesteps": 498129495,
    "learntime": 0.2397840318735689,
    "sampletime": 8.953727933112532,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1408,
    "reward_mean": 14.984896011633237,
    "reward_max": 21.353642236035675,
    "reward_min": -1.738666113303533,
    "reward_std": 5.3242266654724855,
    "timesteps": 498483285,
    "learntime": 0.23045941907912493,
    "sampletime": 8.974279567133635,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1409,
    "reward_mean": 16.38327849255429,
    "reward_max": 21.445435509243733,
    "reward_min": -0.5233218606145175,
    "reward_std": 4.758421117900875,
    "timesteps": 498840846,
    "learntime": 0.23787698009982705,
    "sampletime": 8.913247670978308,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1410,
    "reward_mean": 13.835130004041122,
    "reward_max": 22.3894653211764,
    "reward_min": -11.373760889646796,
    "reward_std": 7.33293132383179,
    "timesteps": 499191180,
    "learntime": 0.24493886413984,
    "sampletime": 8.768504819832742,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1411,
    "reward_mean": 17.440731708380664,
    "reward_max": 21.99955444330247,
    "reward_min": 4.988661633206193,
    "reward_std": 3.792180442160882,
    "timesteps": 499549467,
    "learntime": 0.23519864887930453,
    "sampletime": 9.052232390968129,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1412,
    "reward_mean": 16.235981695248558,
    "reward_max": 22.49677248019725,
    "reward_min": -3.671547155552122,
    "reward_std": 5.228452295007767,
    "timesteps": 499903653,
    "learntime": 0.24315841891802847,
    "sampletime": 8.888409225037321,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1413,
    "reward_mean": 16.748674274321807,
    "reward_max": 21.73173723885944,
    "reward_min": -1.191838534891657,
    "reward_std": 4.643436743534887,
    "timesteps": 500262099,
    "learntime": 0.23404629318974912,
    "sampletime": 8.919955219840631,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1414,
    "reward_mean": 17.62755942151206,
    "reward_max": 22.27997337340881,
    "reward_min": -0.4971788605872676,
    "reward_std": 4.602902246789384,
    "timesteps": 500619417,
    "learntime": 0.23652218305505812,
    "sampletime": 8.946392540121451,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1415,
    "reward_mean": 14.84302018214369,
    "reward_max": 21.543072664202043,
    "reward_min": -11.040113107483998,
    "reward_std": 7.383362008808188,
    "timesteps": 500970066,
    "learntime": 0.23134910687804222,
    "sampletime": 8.89266038686037,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1416,
    "reward_mean": 16.89451795894494,
    "reward_max": 22.274043514739862,
    "reward_min": -9.811131245513087,
    "reward_std": 6.546110193926787,
    "timesteps": 501325191,
    "learntime": 0.2574010358657688,
    "sampletime": 8.877592643955722,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1417,
    "reward_mean": 14.757676018547553,
    "reward_max": 22.88257357215325,
    "reward_min": 0.3478442296877233,
    "reward_std": 6.580064730442805,
    "timesteps": 501676170,
    "learntime": 0.30250465008430183,
    "sampletime": 8.747572337975726,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1418,
    "reward_mean": 16.4138998286556,
    "reward_max": 22.639697802009657,
    "reward_min": 0.20133181823378146,
    "reward_std": 5.30407838343203,
    "timesteps": 502030095,
    "learntime": 0.23745346209034324,
    "sampletime": 8.826292334822938,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1419,
    "reward_mean": 18.118772875988803,
    "reward_max": 23.021018899109386,
    "reward_min": 0.5288548325188401,
    "reward_std": 4.482037737104415,
    "timesteps": 502386711,
    "learntime": 0.23290885612368584,
    "sampletime": 8.88613158185035,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1420,
    "reward_mean": 18.48237760650752,
    "reward_max": 22.825123599893594,
    "reward_min": 0.38606632407049185,
    "reward_std": 4.326796497983396,
    "timesteps": 502744779,
    "learntime": 0.2653195590246469,
    "sampletime": 9.032296834047884,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1421,
    "reward_mean": 16.206664202590673,
    "reward_max": 22.66327670876048,
    "reward_min": -5.592845406758396,
    "reward_std": 6.83787886123002,
    "timesteps": 503097996,
    "learntime": 0.23253320902585983,
    "sampletime": 8.920595635892823,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1422,
    "reward_mean": 17.382622899255445,
    "reward_max": 22.704781805203467,
    "reward_min": 0.35083324182425585,
    "reward_std": 5.147619637994325,
    "timesteps": 503455152,
    "learntime": 0.29812665400095284,
    "sampletime": 8.913593282923102,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1423,
    "reward_mean": 14.639292699673511,
    "reward_max": 22.70871608975258,
    "reward_min": -7.524730035730194,
    "reward_std": 7.395013471572587,
    "timesteps": 503805396,
    "learntime": 0.23517951788380742,
    "sampletime": 8.776869338937104,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1424,
    "reward_mean": 17.108045071370956,
    "reward_max": 22.799369644108637,
    "reward_min": 0.5811983494301423,
    "reward_std": 5.402239129371622,
    "timesteps": 504157725,
    "learntime": 0.2831855518743396,
    "sampletime": 8.906792376190424,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1425,
    "reward_mean": 17.24959221361233,
    "reward_max": 23.13046394485388,
    "reward_min": 0.11732338471901729,
    "reward_std": 6.0022887130951394,
    "timesteps": 504512025,
    "learntime": 0.23567081079818308,
    "sampletime": 8.90548979700543,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1426,
    "reward_mean": 12.031247137798639,
    "reward_max": 22.961354219830937,
    "reward_min": -16.288861338760608,
    "reward_std": 9.597877586737882,
    "timesteps": 504858705,
    "learntime": 0.2777646789327264,
    "sampletime": 8.64784846198745,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1427,
    "reward_mean": 15.280905998016461,
    "reward_max": 22.27133949642479,
    "reward_min": -8.28558894190373,
    "reward_std": 8.020695067820018,
    "timesteps": 505209126,
    "learntime": 0.2302115170750767,
    "sampletime": 8.736319153103977,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1428,
    "reward_mean": 15.667383647173363,
    "reward_max": 22.882925346105665,
    "reward_min": -1.0243098707922618,
    "reward_std": 6.877835608593988,
    "timesteps": 505560417,
    "learntime": 0.27646841504611075,
    "sampletime": 8.90439899591729,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1429,
    "reward_mean": 15.098732385578792,
    "reward_max": 23.510218653813787,
    "reward_min": -20.050162544220015,
    "reward_std": 8.937491811011647,
    "timesteps": 505911918,
    "learntime": 0.2350485110655427,
    "sampletime": 8.89720594487153,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1430,
    "reward_mean": 16.04540404540002,
    "reward_max": 23.148131828853913,
    "reward_min": -10.695027837558,
    "reward_std": 7.322264427474627,
    "timesteps": 506264430,
    "learntime": 0.27871731691993773,
    "sampletime": 8.83170864987187,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1431,
    "reward_mean": 19.234673080344578,
    "reward_max": 23.157334758561436,
    "reward_min": 0.2063146849395685,
    "reward_std": 4.192604794554194,
    "timesteps": 506622558,
    "learntime": 0.223969321930781,
    "sampletime": 8.924853709992021,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1432,
    "reward_mean": 15.570676605993352,
    "reward_max": 21.814136251535576,
    "reward_min": -0.7200443507736622,
    "reward_std": 6.623023455577478,
    "timesteps": 506976954,
    "learntime": 0.28350531007163227,
    "sampletime": 8.847888117888942,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1433,
    "reward_mean": 15.904525465024337,
    "reward_max": 22.746724451144196,
    "reward_min": -11.258978310012909,
    "reward_std": 7.204764091843876,
    "timesteps": 507327981,
    "learntime": 0.2351337280124426,
    "sampletime": 8.929510387126356,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1434,
    "reward_mean": 15.084528209206002,
    "reward_max": 22.102625032999743,
    "reward_min": -9.936657314388105,
    "reward_std": 7.3710633914013926,
    "timesteps": 507679281,
    "learntime": 0.2891289610415697,
    "sampletime": 8.855682727880776,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1435,
    "reward_mean": 18.204513403436106,
    "reward_max": 23.311897802004363,
    "reward_min": -0.8054282872330863,
    "reward_std": 4.7932653805749075,
    "timesteps": 508034457,
    "learntime": 0.23914658511057496,
    "sampletime": 8.866870920173824,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1436,
    "reward_mean": 16.228726656526074,
    "reward_max": 22.203064034259608,
    "reward_min": -2.1598278769145587,
    "reward_std": 6.921672338963558,
    "timesteps": 508387395,
    "learntime": 0.2808402730152011,
    "sampletime": 8.949764649150893,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1437,
    "reward_mean": 14.118778478544789,
    "reward_max": 22.605412242595452,
    "reward_min": -22.51026230618696,
    "reward_std": 8.801874272610844,
    "timesteps": 508735230,
    "learntime": 0.2344258080702275,
    "sampletime": 8.80179744400084,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1438,
    "reward_mean": 15.43658993841687,
    "reward_max": 22.29403317753564,
    "reward_min": -1.0958616222029187,
    "reward_std": 6.669770005739933,
    "timesteps": 509084073,
    "learntime": 0.28672290104441345,
    "sampletime": 8.723118572961539,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1439,
    "reward_mean": 15.416626378250024,
    "reward_max": 22.740191398957514,
    "reward_min": -12.246677583422171,
    "reward_std": 7.0149644177014565,
    "timesteps": 509435019,
    "learntime": 0.24057228304445744,
    "sampletime": 8.766426973976195,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1440,
    "reward_mean": 15.405014221748424,
    "reward_max": 21.959369396057095,
    "reward_min": -12.325502536155522,
    "reward_std": 7.521683781065413,
    "timesteps": 509787678,
    "learntime": 0.2810030479449779,
    "sampletime": 8.891850902000442,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1441,
    "reward_mean": 17.76080751395333,
    "reward_max": 22.25119638423237,
    "reward_min": 7.58843131810709,
    "reward_std": 4.427446560565449,
    "timesteps": 510143769,
    "learntime": 0.23582254094071686,
    "sampletime": 8.851511008106172,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1442,
    "reward_mean": 17.102189818965265,
    "reward_max": 22.553814160051953,
    "reward_min": 7.256994532130193,
    "reward_std": 4.821216781699773,
    "timesteps": 510499614,
    "learntime": 0.28395033185370266,
    "sampletime": 8.853383196983486,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1443,
    "reward_mean": 15.951285213367854,
    "reward_max": 22.057367674667724,
    "reward_min": -0.8648525708439675,
    "reward_std": 5.734704950403759,
    "timesteps": 510852522,
    "learntime": 0.23642778699286282,
    "sampletime": 8.936587005853653,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1444,
    "reward_mean": 16.482258453872454,
    "reward_max": 22.074977074979063,
    "reward_min": 6.64810454947027,
    "reward_std": 4.748737203670608,
    "timesteps": 511206525,
    "learntime": 0.29679739102721214,
    "sampletime": 8.809046998852864,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1445,
    "reward_mean": 16.680514606196702,
    "reward_max": 21.59876428233022,
    "reward_min": -0.8582306543284033,
    "reward_std": 4.776233048789852,
    "timesteps": 511562499,
    "learntime": 0.24079919792711735,
    "sampletime": 8.922941390890628,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1446,
    "reward_mean": 16.264163436582766,
    "reward_max": 21.945567168780446,
    "reward_min": -0.3795654925969307,
    "reward_std": 5.35844068068344,
    "timesteps": 511916082,
    "learntime": 0.2745034000836313,
    "sampletime": 8.866728367982432,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1447,
    "reward_mean": 17.67209891138629,
    "reward_max": 23.0954672764514,
    "reward_min": -2.390176438176159,
    "reward_std": 5.136029820098644,
    "timesteps": 512272230,
    "learntime": 0.240636341040954,
    "sampletime": 8.940894735045731,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1448,
    "reward_mean": 15.166056069408413,
    "reward_max": 21.26114211641392,
    "reward_min": -22.13153042307363,
    "reward_std": 7.62993146857666,
    "timesteps": 512626446,
    "learntime": 0.2314768279902637,
    "sampletime": 8.892954749055207,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1449,
    "reward_mean": 17.063875242700252,
    "reward_max": 21.714115346323293,
    "reward_min": 6.712222923679899,
    "reward_std": 3.895393069161506,
    "timesteps": 512983977,
    "learntime": 0.22837828705087304,
    "sampletime": 8.880231486167759,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1450,
    "reward_mean": 14.974912986856712,
    "reward_max": 21.070032495162913,
    "reward_min": -1.2937098089782013,
    "reward_std": 5.788472647388659,
    "timesteps": 513336540,
    "learntime": 0.2321474370546639,
    "sampletime": 8.892164089018479,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1451,
    "reward_mean": 16.364104749343245,
    "reward_max": 20.96329425714176,
    "reward_min": -2.297461638091288,
    "reward_std": 4.854763087355238,
    "timesteps": 513692097,
    "learntime": 0.23119710199534893,
    "sampletime": 8.819146414054558,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1452,
    "reward_mean": 18.92123443114614,
    "reward_max": 21.81195469019285,
    "reward_min": 15.187965900340878,
    "reward_std": 1.4135716410643004,
    "timesteps": 514052817,
    "learntime": 0.2364604971371591,
    "sampletime": 8.734311765059829,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1453,
    "reward_mean": 15.25789244186953,
    "reward_max": 21.53596026753884,
    "reward_min": -5.3022751002078605,
    "reward_std": 5.7431013084459295,
    "timesteps": 514406274,
    "learntime": 0.23914950713515282,
    "sampletime": 8.799527442082763,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1454,
    "reward_mean": 15.356384463928189,
    "reward_max": 21.849026951741312,
    "reward_min": -1.9250050850642964,
    "reward_std": 5.8259987429732885,
    "timesteps": 514759407,
    "learntime": 0.23193912487477064,
    "sampletime": 8.757883633021265,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1455,
    "reward_mean": 15.651623609190096,
    "reward_max": 22.175275449993823,
    "reward_min": -2.740695645496476,
    "reward_std": 6.147915312861294,
    "timesteps": 515111688,
    "learntime": 0.23773891804739833,
    "sampletime": 8.944552698172629,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1456,
    "reward_mean": 12.960551322396444,
    "reward_max": 21.226689585948602,
    "reward_min": -11.328510933365164,
    "reward_std": 7.2991414301748145,
    "timesteps": 515458530,
    "learntime": 0.24377351091243327,
    "sampletime": 8.74433749797754,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1457,
    "reward_mean": 15.066223502274692,
    "reward_max": 22.688198187078044,
    "reward_min": -0.7924763200296202,
    "reward_std": 6.333664342671688,
    "timesteps": 515808348,
    "learntime": 0.2355091602075845,
    "sampletime": 8.793786292895675,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1458,
    "reward_mean": 13.891179741804915,
    "reward_max": 21.55909733643762,
    "reward_min": -11.458604655369669,
    "reward_std": 6.976105823519936,
    "timesteps": 516157983,
    "learntime": 0.23949854308739305,
    "sampletime": 8.77686833194457,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1459,
    "reward_mean": 15.274709811221417,
    "reward_max": 21.778081472445695,
    "reward_min": -2.3636242196111255,
    "reward_std": 6.612919437076285,
    "timesteps": 516508374,
    "learntime": 0.22791409492492676,
    "sampletime": 8.834876884007826,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1460,
    "reward_mean": 15.000454345241195,
    "reward_max": 22.662324399528895,
    "reward_min": -1.505705008638679,
    "reward_std": 6.826437758157185,
    "timesteps": 516857874,
    "learntime": 0.23060066113248467,
    "sampletime": 8.85756998998113,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1461,
    "reward_mean": 15.011638783559604,
    "reward_max": 22.200880392660938,
    "reward_min": -1.2677611814543701,
    "reward_std": 6.018684456563752,
    "timesteps": 517209930,
    "learntime": 0.231801024870947,
    "sampletime": 8.84768831403926,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1462,
    "reward_mean": 17.98120917405516,
    "reward_max": 22.123338378652765,
    "reward_min": 7.05172785309453,
    "reward_std": 4.4014399394589105,
    "timesteps": 517566261,
    "learntime": 0.2384858699515462,
    "sampletime": 8.951029407093301,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1463,
    "reward_mean": 15.589115769302666,
    "reward_max": 22.721602802277737,
    "reward_min": -3.4909469963502975,
    "reward_std": 6.563839082742279,
    "timesteps": 517916232,
    "learntime": 0.2436961659695953,
    "sampletime": 8.807551700156182,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1464,
    "reward_mean": 17.443531504731027,
    "reward_max": 22.595900483623453,
    "reward_min": 0.30292506249517953,
    "reward_std": 4.850989618766459,
    "timesteps": 518272929,
    "learntime": 0.23876853985711932,
    "sampletime": 8.994940616888925,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1465,
    "reward_mean": 16.362073978378568,
    "reward_max": 22.28218052570644,
    "reward_min": -0.5948060698256993,
    "reward_std": 5.562518816281965,
    "timesteps": 518627037,
    "learntime": 0.23108995892107487,
    "sampletime": 8.78320460114628,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1466,
    "reward_mean": 17.647401687648795,
    "reward_max": 22.55348802859909,
    "reward_min": -12.1780087353704,
    "reward_std": 7.227754979824947,
    "timesteps": 518981226,
    "learntime": 0.23734197090379894,
    "sampletime": 8.798793524038047,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1467,
    "reward_mean": 13.727960156360723,
    "reward_max": 22.87192263111831,
    "reward_min": -10.495371124382611,
    "reward_std": 8.412076978441279,
    "timesteps": 519329520,
    "learntime": 0.23228576499968767,
    "sampletime": 8.789407431147993,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1468,
    "reward_mean": 15.58998918546574,
    "reward_max": 22.348570552718066,
    "reward_min": -20.504996191251625,
    "reward_std": 7.7346757414585205,
    "timesteps": 519679611,
    "learntime": 0.23179892916232347,
    "sampletime": 8.785360063891858,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1469,
    "reward_mean": 16.332983394482632,
    "reward_max": 23.430180275417626,
    "reward_min": -11.924460652585061,
    "reward_std": 7.128044392365985,
    "timesteps": 520029033,
    "learntime": 0.23267044709064066,
    "sampletime": 8.914773193886504,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1470,
    "reward_mean": 17.957727310064943,
    "reward_max": 23.180302992859104,
    "reward_min": 0.8125376052956849,
    "reward_std": 5.0011178711908055,
    "timesteps": 520383633,
    "learntime": 0.23281668196432292,
    "sampletime": 8.802016898058355,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1471,
    "reward_mean": 16.65832121827455,
    "reward_max": 23.082279239470765,
    "reward_min": -10.645793855472503,
    "reward_std": 6.527451600318341,
    "timesteps": 520737405,
    "learntime": 0.22885307506658137,
    "sampletime": 8.797772199846804,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1472,
    "reward_mean": 16.767600993143482,
    "reward_max": 23.04310429730619,
    "reward_min": -7.929768557142883,
    "reward_std": 6.78460444044179,
    "timesteps": 521087736,
    "learntime": 0.23724601999856532,
    "sampletime": 8.84049957501702,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1473,
    "reward_mean": 18.844248808643485,
    "reward_max": 23.68698864808009,
    "reward_min": 0.127155192383927,
    "reward_std": 4.302962640748951,
    "timesteps": 521444907,
    "learntime": 0.23446527495980263,
    "sampletime": 9.073253340087831,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1474,
    "reward_mean": 17.235092578843833,
    "reward_max": 23.11361239423665,
    "reward_min": -10.218762937425218,
    "reward_std": 6.469902113291932,
    "timesteps": 521797914,
    "learntime": 0.23541789688169956,
    "sampletime": 8.83085676212795,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1475,
    "reward_mean": 15.856965716266886,
    "reward_max": 22.62195353957014,
    "reward_min": -20.72995283106117,
    "reward_std": 7.151109475388065,
    "timesteps": 522150462,
    "learntime": 0.24100147187709808,
    "sampletime": 8.8361643969547,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1476,
    "reward_mean": 16.006616730775036,
    "reward_max": 23.038373469290406,
    "reward_min": -8.456266954049687,
    "reward_std": 7.122272645262557,
    "timesteps": 522501597,
    "learntime": 0.23793219705112278,
    "sampletime": 8.777472621994093,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1477,
    "reward_mean": 13.799885547517409,
    "reward_max": 23.069438245563738,
    "reward_min": -0.8674259100913612,
    "reward_std": 7.754947079390605,
    "timesteps": 522847860,
    "learntime": 0.23922244110144675,
    "sampletime": 8.593027224997059,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1478,
    "reward_mean": 15.059401445501814,
    "reward_max": 23.72577624831517,
    "reward_min": -0.714958289613471,
    "reward_std": 7.219565616638021,
    "timesteps": 523197540,
    "learntime": 0.23937436589039862,
    "sampletime": 8.665153732988983,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1479,
    "reward_mean": 15.151243340397397,
    "reward_max": 23.273484587380754,
    "reward_min": -1.7494985760528314,
    "reward_std": 7.638689241630076,
    "timesteps": 523546095,
    "learntime": 0.23478898499161005,
    "sampletime": 8.824477760819718,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1480,
    "reward_mean": 17.116886768420187,
    "reward_max": 23.812772382267408,
    "reward_min": -0.4130663246368,
    "reward_std": 5.515679104610906,
    "timesteps": 523898976,
    "learntime": 0.23435467784292996,
    "sampletime": 8.7530136059504,
    "best_max_mean": 17.889918623988216,
    "best_max": 23.95931725036071
  },
  {
    "gen": 1481,
    "reward_mean": 16.604325324685654,
    "reward_max": 24.07411085208172,
    "reward_min": -1.3299181818411754,
    "reward_std": 5.543665712040906,
    "timesteps": 524253102,
    "learntime": 0.23947009490802884,
    "sampletime": 8.804123805137351,
    "best_max_mean": 16.604325324685654,
    "best_max": 24.07411085208172
  },
  {
    "gen": 1482,
    "reward_mean": 15.328219346294812,
    "reward_max": 23.149562322957944,
    "reward_min": -16.629255972259372,
    "reward_std": 7.060087836804617,
    "timesteps": 524604615,
    "learntime": 0.22799777891486883,
    "sampletime": 8.759992316132411,
    "best_max_mean": 16.604325324685654,
    "best_max": 24.07411085208172
  },
  {
    "gen": 1483,
    "reward_mean": 17.007988785544654,
    "reward_max": 24.106941965833713,
    "reward_min": -0.3609311562207942,
    "reward_std": 5.58915614819219,
    "timesteps": 524959200,
    "learntime": 0.24235618603415787,
    "sampletime": 8.723975637927651,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1484,
    "reward_mean": 16.625657496313032,
    "reward_max": 22.12241100683406,
    "reward_min": -1.1210523445360348,
    "reward_std": 6.116911381911784,
    "timesteps": 525311733,
    "learntime": 0.2440148121677339,
    "sampletime": 8.705497229006141,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1485,
    "reward_mean": 14.460518274260021,
    "reward_max": 22.26496892894565,
    "reward_min": -10.555011488723038,
    "reward_std": 7.567289462905076,
    "timesteps": 525661317,
    "learntime": 0.23470559692941606,
    "sampletime": 8.563275425927714,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1486,
    "reward_mean": 16.416900589820028,
    "reward_max": 23.787287108118605,
    "reward_min": -11.153126785002483,
    "reward_std": 7.467332071467169,
    "timesteps": 526012479,
    "learntime": 0.23909691418521106,
    "sampletime": 8.841152648907155,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1487,
    "reward_mean": 19.18742224294509,
    "reward_max": 23.026959772362847,
    "reward_min": -4.335077727565393,
    "reward_std": 4.767094810195809,
    "timesteps": 526370292,
    "learntime": 0.2393538171891123,
    "sampletime": 8.939401629846543,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1488,
    "reward_mean": 18.718613227873806,
    "reward_max": 22.687910096354738,
    "reward_min": 0.17122426063217525,
    "reward_std": 4.589290868872465,
    "timesteps": 526727478,
    "learntime": 0.24687270796857774,
    "sampletime": 9.007098849164322,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1489,
    "reward_mean": 17.19665844682639,
    "reward_max": 22.174603537083104,
    "reward_min": 1.4443961969195183,
    "reward_std": 4.990052000797178,
    "timesteps": 527083323,
    "learntime": 0.23758228798396885,
    "sampletime": 8.894330783048645,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1490,
    "reward_mean": 16.4016656606464,
    "reward_max": 23.082075462748914,
    "reward_min": -0.7224068943989699,
    "reward_std": 5.975537985782857,
    "timesteps": 527435703,
    "learntime": 0.23635322111658752,
    "sampletime": 8.822867552982643,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1491,
    "reward_mean": 17.39988524381686,
    "reward_max": 22.909949617240326,
    "reward_min": 0.7781712556930458,
    "reward_std": 5.3815261045498515,
    "timesteps": 527789598,
    "learntime": 0.2978132599964738,
    "sampletime": 8.86471180897206,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1492,
    "reward_mean": 17.47531641277059,
    "reward_max": 22.43974047425118,
    "reward_min": -1.899024779442703,
    "reward_std": 6.213211973786197,
    "timesteps": 528143340,
    "learntime": 0.23204806493595243,
    "sampletime": 8.828459157142788,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1493,
    "reward_mean": 16.741495634317186,
    "reward_max": 22.738590612887602,
    "reward_min": -10.755649574566634,
    "reward_std": 5.993425803451574,
    "timesteps": 528496548,
    "learntime": 0.281699056038633,
    "sampletime": 8.89917986607179,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1494,
    "reward_mean": 16.076954516608662,
    "reward_max": 21.584879033443887,
    "reward_min": -1.8432154281375317,
    "reward_std": 5.4692244341078835,
    "timesteps": 528851517,
    "learntime": 0.23797632893547416,
    "sampletime": 8.82730009383522,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1495,
    "reward_mean": 17.154320948994037,
    "reward_max": 23.68005919322427,
    "reward_min": 0.014112380135692281,
    "reward_std": 5.683459452883371,
    "timesteps": 529204011,
    "learntime": 0.30096451798453927,
    "sampletime": 8.946080937050283,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1496,
    "reward_mean": 17.058117331079544,
    "reward_max": 23.389282943631496,
    "reward_min": -0.3564434269921746,
    "reward_std": 5.593462915318184,
    "timesteps": 529559754,
    "learntime": 0.24523249687626958,
    "sampletime": 8.978029073914513,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1497,
    "reward_mean": 17.44504379024369,
    "reward_max": 22.617099073805473,
    "reward_min": -1.6400859570659845,
    "reward_std": 5.562137673472358,
    "timesteps": 529914555,
    "learntime": 0.2869886099360883,
    "sampletime": 8.876785934902728,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1498,
    "reward_mean": 18.220101485100002,
    "reward_max": 22.61877060184875,
    "reward_min": 8.003041666890072,
    "reward_std": 3.0123816463604487,
    "timesteps": 530272986,
    "learntime": 0.24597962899133563,
    "sampletime": 8.889416923979297,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1499,
    "reward_mean": 16.12741770830943,
    "reward_max": 21.844405263992172,
    "reward_min": -3.0071179129149823,
    "reward_std": 5.194821936631407,
    "timesteps": 530628351,
    "learntime": 0.28920173505321145,
    "sampletime": 8.836346227908507,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1500,
    "reward_mean": 17.763114904518147,
    "reward_max": 22.74660535883441,
    "reward_min": 0.45909899437912477,
    "reward_std": 4.47976555604002,
    "timesteps": 530985282,
    "learntime": 0.24086426198482513,
    "sampletime": 8.650186883984134,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1501,
    "reward_mean": 17.119536141290343,
    "reward_max": 22.17579858513394,
    "reward_min": 7.045559435539567,
    "reward_std": 3.641676266461676,
    "timesteps": 531342573,
    "learntime": 0.28405538108199835,
    "sampletime": 8.71582961594686,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1502,
    "reward_mean": 16.9520523119749,
    "reward_max": 21.12388816174599,
    "reward_min": 6.353002847249922,
    "reward_std": 3.632482027302862,
    "timesteps": 531699981,
    "learntime": 0.2426540032029152,
    "sampletime": 8.933736850041896,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1503,
    "reward_mean": 16.450908437183415,
    "reward_max": 22.697559016022936,
    "reward_min": -1.3239285338504176,
    "reward_std": 4.997645004740978,
    "timesteps": 532056186,
    "learntime": 0.29164755903184414,
    "sampletime": 8.846853449940681,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1504,
    "reward_mean": 15.018808046537108,
    "reward_max": 22.564696204822724,
    "reward_min": -1.4914301329038446,
    "reward_std": 6.236159620292833,
    "timesteps": 532409154,
    "learntime": 0.24286810401827097,
    "sampletime": 8.7763256279286,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1505,
    "reward_mean": 16.98263102758562,
    "reward_max": 21.17071164436427,
    "reward_min": 1.713038089504047,
    "reward_std": 3.795278038765652,
    "timesteps": 532766625,
    "learntime": 0.2754014760721475,
    "sampletime": 8.905555813806131,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1506,
    "reward_mean": 16.09889092185869,
    "reward_max": 21.182085334776072,
    "reward_min": 0.2689720660688016,
    "reward_std": 4.380612823336728,
    "timesteps": 533123808,
    "learntime": 0.24634150904603302,
    "sampletime": 8.9230204410851,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1507,
    "reward_mean": 16.81198546057994,
    "reward_max": 20.935708939865844,
    "reward_min": 7.338586186239613,
    "reward_std": 3.1073865791997934,
    "timesteps": 533482569,
    "learntime": 0.2927446379326284,
    "sampletime": 8.9285353270825,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1508,
    "reward_mean": 16.26066535835102,
    "reward_max": 21.236731333940323,
    "reward_min": 0.32688404024197365,
    "reward_std": 4.899459959769192,
    "timesteps": 533838057,
    "learntime": 0.23661361890845,
    "sampletime": 8.949296365957707,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1509,
    "reward_mean": 17.20990029850073,
    "reward_max": 22.877890935691543,
    "reward_min": 0.9787956050713508,
    "reward_std": 4.050657224217668,
    "timesteps": 534195075,
    "learntime": 0.28874917491339147,
    "sampletime": 9.028143918840215,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1510,
    "reward_mean": 17.15485148111633,
    "reward_max": 21.349596060099866,
    "reward_min": -1.0391038780014212,
    "reward_std": 4.3259643677136745,
    "timesteps": 534551406,
    "learntime": 0.2402341179549694,
    "sampletime": 9.00036078505218,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1511,
    "reward_mean": 17.773344790641808,
    "reward_max": 22.137172962678246,
    "reward_min": 6.019798760133034,
    "reward_std": 3.776324036571397,
    "timesteps": 534908778,
    "learntime": 0.28890738100744784,
    "sampletime": 8.948723712004721,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1512,
    "reward_mean": 13.848393760548852,
    "reward_max": 22.422943321330063,
    "reward_min": -7.1498160901117265,
    "reward_std": 6.882038014864516,
    "timesteps": 535259679,
    "learntime": 0.24424446001648903,
    "sampletime": 8.85251072095707,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1513,
    "reward_mean": 16.917656443803246,
    "reward_max": 22.115377247114814,
    "reward_min": 4.8478258958185085,
    "reward_std": 4.2241670802126725,
    "timesteps": 535616190,
    "learntime": 0.28407533606514335,
    "sampletime": 8.81689682090655,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1514,
    "reward_mean": 16.90204580335481,
    "reward_max": 21.9136175432059,
    "reward_min": -12.740316741133226,
    "reward_std": 5.426017332229015,
    "timesteps": 535972818,
    "learntime": 0.2403071050066501,
    "sampletime": 8.855053271865472,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1515,
    "reward_mean": 17.505505323100977,
    "reward_max": 21.99109611917766,
    "reward_min": 5.538216815442975,
    "reward_std": 3.9759717024553893,
    "timesteps": 536330433,
    "learntime": 0.3043523491360247,
    "sampletime": 8.99442883208394,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1516,
    "reward_mean": 18.133408768384015,
    "reward_max": 21.688774154103484,
    "reward_min": 7.871422732286825,
    "reward_std": 2.6647093047111365,
    "timesteps": 536690241,
    "learntime": 0.24610727792605758,
    "sampletime": 9.013891363050789,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1517,
    "reward_mean": 17.542939084415966,
    "reward_max": 23.61738207803643,
    "reward_min": 1.6566435136433368,
    "reward_std": 4.6393504336704385,
    "timesteps": 537045981,
    "learntime": 0.26612028502859175,
    "sampletime": 8.960999763105065,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1518,
    "reward_mean": 18.301922946406386,
    "reward_max": 21.875328160222672,
    "reward_min": 7.734122336554315,
    "reward_std": 3.3210535661555167,
    "timesteps": 537404388,
    "learntime": 0.230753110954538,
    "sampletime": 8.834762013051659,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1519,
    "reward_mean": 17.89395556597642,
    "reward_max": 22.6507126522354,
    "reward_min": -2.034792758021722,
    "reward_std": 4.3885593138202,
    "timesteps": 537761856,
    "learntime": 0.30578022985719144,
    "sampletime": 8.830556261120364,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1520,
    "reward_mean": 15.761195439063888,
    "reward_max": 20.936118852696385,
    "reward_min": -3.4782808311283606,
    "reward_std": 5.70251700360303,
    "timesteps": 538116147,
    "learntime": 0.2382138930261135,
    "sampletime": 8.919771485961974,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1521,
    "reward_mean": 17.84870192811582,
    "reward_max": 22.017232749300703,
    "reward_min": 7.587692517603781,
    "reward_std": 3.214091253742581,
    "timesteps": 538474623,
    "learntime": 0.29729179688729346,
    "sampletime": 9.00292909401469,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1522,
    "reward_mean": 16.664987389955193,
    "reward_max": 22.00305956435587,
    "reward_min": -1.1730762752986528,
    "reward_std": 5.326152154274491,
    "timesteps": 538831629,
    "learntime": 0.23305523488670588,
    "sampletime": 8.928959948010743,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1523,
    "reward_mean": 18.899343234032088,
    "reward_max": 22.10425979288287,
    "reward_min": 9.343344897704403,
    "reward_std": 2.438158056207497,
    "timesteps": 539191302,
    "learntime": 0.236743011046201,
    "sampletime": 8.868044629925862,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1524,
    "reward_mean": 16.626555609984642,
    "reward_max": 22.941246415728312,
    "reward_min": -4.7555476719082295,
    "reward_std": 5.978579102202142,
    "timesteps": 539545107,
    "learntime": 0.23949706298299134,
    "sampletime": 8.892667012056336,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1525,
    "reward_mean": 17.051881447299948,
    "reward_max": 22.544657202975497,
    "reward_min": -0.2693062131616519,
    "reward_std": 4.763347202292785,
    "timesteps": 539900124,
    "learntime": 0.23601686605252326,
    "sampletime": 8.785808969987556,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1526,
    "reward_mean": 17.880857799538433,
    "reward_max": 22.57063730158419,
    "reward_min": 7.806515398265963,
    "reward_std": 4.412148548260926,
    "timesteps": 540255636,
    "learntime": 0.23582495609298348,
    "sampletime": 8.943379553034902,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1527,
    "reward_mean": 16.007737047497635,
    "reward_max": 22.24787568772445,
    "reward_min": -0.8376728626193852,
    "reward_std": 6.092842126909577,
    "timesteps": 540609078,
    "learntime": 0.23401939403265715,
    "sampletime": 8.74694417300634,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1528,
    "reward_mean": 17.3941364765507,
    "reward_max": 22.44584984539114,
    "reward_min": -0.2406831106989535,
    "reward_std": 5.233602275126384,
    "timesteps": 540964524,
    "learntime": 0.23510861000977457,
    "sampletime": 8.821044160053134,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1529,
    "reward_mean": 17.41108078505713,
    "reward_max": 23.029078719382536,
    "reward_min": -0.806109745111879,
    "reward_std": 5.674216205693143,
    "timesteps": 541320696,
    "learntime": 0.2412554849870503,
    "sampletime": 8.85252208611928,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1530,
    "reward_mean": 16.199276034697522,
    "reward_max": 23.360332826667506,
    "reward_min": -11.62897770187225,
    "reward_std": 6.917864329429969,
    "timesteps": 541674960,
    "learntime": 0.2325285649858415,
    "sampletime": 8.951281115878373,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1531,
    "reward_mean": 17.197343134284978,
    "reward_max": 23.055249667147905,
    "reward_min": -2.0081005485474432,
    "reward_std": 5.7282888862312324,
    "timesteps": 542031345,
    "learntime": 0.23079259390942752,
    "sampletime": 8.62159295193851,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1532,
    "reward_mean": 19.30950984546675,
    "reward_max": 23.159296031852577,
    "reward_min": 8.74943519294946,
    "reward_std": 3.116517173373628,
    "timesteps": 542389986,
    "learntime": 0.2384112630970776,
    "sampletime": 8.922713659936562,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1533,
    "reward_mean": 15.06680367377282,
    "reward_max": 22.604757835231293,
    "reward_min": -9.820664759753553,
    "reward_std": 7.626415459105428,
    "timesteps": 542739786,
    "learntime": 0.23393870191648602,
    "sampletime": 8.771380006102845,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1534,
    "reward_mean": 13.304205289586847,
    "reward_max": 22.467938057121092,
    "reward_min": -31.961980566706963,
    "reward_std": 9.753912733309775,
    "timesteps": 543084657,
    "learntime": 0.25094343116506934,
    "sampletime": 8.710141530027613,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1535,
    "reward_mean": 12.668408961559814,
    "reward_max": 22.628537470940497,
    "reward_min": -8.814199524174908,
    "reward_std": 8.049098068922877,
    "timesteps": 543431352,
    "learntime": 0.23955255700275302,
    "sampletime": 8.834254949120805,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1536,
    "reward_mean": 14.989688896708453,
    "reward_max": 23.34750243291527,
    "reward_min": -12.64335540755455,
    "reward_std": 7.82381340075038,
    "timesteps": 543780945,
    "learntime": 0.24379326100461185,
    "sampletime": 8.717868169071153,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1537,
    "reward_mean": 15.673154708484853,
    "reward_max": 22.885168925186562,
    "reward_min": -3.6057198248648414,
    "reward_std": 6.926873270229873,
    "timesteps": 544132710,
    "learntime": 0.2391367950476706,
    "sampletime": 8.757344099925831,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1538,
    "reward_mean": 16.313012001808886,
    "reward_max": 23.634753851056413,
    "reward_min": -10.695510622300917,
    "reward_std": 7.5059826634740725,
    "timesteps": 544485192,
    "learntime": 0.24232772807590663,
    "sampletime": 8.76491858321242,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1539,
    "reward_mean": 16.120859096546916,
    "reward_max": 22.828516036964075,
    "reward_min": 1.6927808661624182,
    "reward_std": 5.416571761719461,
    "timesteps": 544836552,
    "learntime": 0.2351228049956262,
    "sampletime": 8.903881269041449,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1540,
    "reward_mean": 16.134547490049158,
    "reward_max": 22.464088436607693,
    "reward_min": -10.759504436607001,
    "reward_std": 6.890666872457394,
    "timesteps": 545190369,
    "learntime": 0.24349877797067165,
    "sampletime": 8.828523187199607,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1541,
    "reward_mean": 14.021674339241958,
    "reward_max": 23.27108387102965,
    "reward_min": -11.58490071533192,
    "reward_std": 7.646735808723412,
    "timesteps": 545539767,
    "learntime": 0.23714863089844584,
    "sampletime": 8.819209543056786,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1542,
    "reward_mean": 14.424218752736081,
    "reward_max": 23.485826736051504,
    "reward_min": -10.638211483289275,
    "reward_std": 7.113540071448867,
    "timesteps": 545891085,
    "learntime": 0.23814367991872132,
    "sampletime": 8.81039981590584,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1543,
    "reward_mean": 18.140253507614382,
    "reward_max": 22.330833177237455,
    "reward_min": -3.0721962836458228,
    "reward_std": 4.906344959042182,
    "timesteps": 546248418,
    "learntime": 0.2366871340200305,
    "sampletime": 8.974365259055048,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1544,
    "reward_mean": 15.132075088996483,
    "reward_max": 22.870899569424278,
    "reward_min": -2.8213003934122933,
    "reward_std": 6.822594393732583,
    "timesteps": 546601545,
    "learntime": 0.2336785930674523,
    "sampletime": 8.666034570895135,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1545,
    "reward_mean": 16.795778134853727,
    "reward_max": 22.90323553597696,
    "reward_min": -1.1132150523816065,
    "reward_std": 6.030650100013058,
    "timesteps": 546956346,
    "learntime": 0.24534734804183245,
    "sampletime": 8.681570556014776,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1546,
    "reward_mean": 19.468285620956948,
    "reward_max": 22.9147178739782,
    "reward_min": 10.133486120876936,
    "reward_std": 2.2274915238929935,
    "timesteps": 547316769,
    "learntime": 0.24197992612607777,
    "sampletime": 8.765572359086946,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1547,
    "reward_mean": 16.615628236906662,
    "reward_max": 22.02888521444078,
    "reward_min": -0.8833672526772254,
    "reward_std": 5.127204075827775,
    "timesteps": 547671324,
    "learntime": 0.23329277988523245,
    "sampletime": 8.860167357837781,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1548,
    "reward_mean": 18.251729587045595,
    "reward_max": 22.393251899379365,
    "reward_min": -0.7597946852532105,
    "reward_std": 4.4596288250058365,
    "timesteps": 548028807,
    "learntime": 0.24630846199579537,
    "sampletime": 8.918110280064866,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1549,
    "reward_mean": 16.15102928966869,
    "reward_max": 22.5203251821892,
    "reward_min": -0.26096843329853375,
    "reward_std": 5.544185115260946,
    "timesteps": 548384823,
    "learntime": 0.24327665893360972,
    "sampletime": 8.813661623978987,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1550,
    "reward_mean": 18.60990477073704,
    "reward_max": 22.784964348753974,
    "reward_min": 1.3216403928712324,
    "reward_std": 3.850428803695802,
    "timesteps": 548743926,
    "learntime": 0.2502675799187273,
    "sampletime": 8.892823475878686,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1551,
    "reward_mean": 16.714269693059222,
    "reward_max": 22.242134988353218,
    "reward_min": -1.3671404110800494,
    "reward_std": 6.21104888821297,
    "timesteps": 549098388,
    "learntime": 0.23932684189639986,
    "sampletime": 8.654255277942866,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1552,
    "reward_mean": 16.46864515121913,
    "reward_max": 22.80318942851612,
    "reward_min": -1.0854768836465076,
    "reward_std": 5.583520382279277,
    "timesteps": 549454989,
    "learntime": 0.2544536308851093,
    "sampletime": 8.962264570174739,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1553,
    "reward_mean": 18.53343447940631,
    "reward_max": 21.54283127820852,
    "reward_min": 8.419566512799285,
    "reward_std": 2.9521887076191784,
    "timesteps": 549814626,
    "learntime": 0.2352978060953319,
    "sampletime": 8.921178226126358,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1554,
    "reward_mean": 18.007324662427294,
    "reward_max": 22.44155545063514,
    "reward_min": 8.382740512590818,
    "reward_std": 3.142079393613971,
    "timesteps": 550173363,
    "learntime": 0.2510813479311764,
    "sampletime": 8.894842783920467,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1555,
    "reward_mean": 15.66546278733799,
    "reward_max": 21.614526516376905,
    "reward_min": -2.7457404323733625,
    "reward_std": 5.748780783823609,
    "timesteps": 550527804,
    "learntime": 0.24533252092078328,
    "sampletime": 8.81151783815585,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1556,
    "reward_mean": 17.685306724985974,
    "reward_max": 21.793423319338924,
    "reward_min": 9.1733187138752,
    "reward_std": 3.353447732844961,
    "timesteps": 550885455,
    "learntime": 0.24543855106458068,
    "sampletime": 8.923295688815415,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1557,
    "reward_mean": 17.378816479893956,
    "reward_max": 21.995052166332513,
    "reward_min": -0.7161098525021948,
    "reward_std": 4.3562566543424275,
    "timesteps": 551244759,
    "learntime": 0.2354760190937668,
    "sampletime": 8.861221947940066,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1558,
    "reward_mean": 17.982528535952433,
    "reward_max": 21.384726458253816,
    "reward_min": 5.11116508136955,
    "reward_std": 2.7048979001482474,
    "timesteps": 551604633,
    "learntime": 0.24066727794706821,
    "sampletime": 8.954217812977731,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1559,
    "reward_mean": 17.77846817219687,
    "reward_max": 22.067859718752448,
    "reward_min": 7.936245497574819,
    "reward_std": 3.3111051147383583,
    "timesteps": 551963865,
    "learntime": 0.24873061198741198,
    "sampletime": 8.902512873988599,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1560,
    "reward_mean": 16.58980837754794,
    "reward_max": 21.397778797367607,
    "reward_min": -5.224760981902147,
    "reward_std": 5.22470263881345,
    "timesteps": 552321225,
    "learntime": 0.23341887583956122,
    "sampletime": 8.905576776945964,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1561,
    "reward_mean": 18.3960243452799,
    "reward_max": 21.76332331387999,
    "reward_min": 14.495743556992347,
    "reward_std": 1.440833076396917,
    "timesteps": 552681945,
    "learntime": 0.279787841020152,
    "sampletime": 8.994901919038966,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1562,
    "reward_mean": 16.91749896557971,
    "reward_max": 21.43213343642877,
    "reward_min": -10.034587876056323,
    "reward_std": 5.070174135942614,
    "timesteps": 553038261,
    "learntime": 0.24796488392166793,
    "sampletime": 8.849989356007427,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1563,
    "reward_mean": 17.10686380022326,
    "reward_max": 20.504900047929507,
    "reward_min": 6.019188431197435,
    "reward_std": 3.2618771559229773,
    "timesteps": 553396569,
    "learntime": 0.2477577649988234,
    "sampletime": 8.82396400696598,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1564,
    "reward_mean": 16.3942335273462,
    "reward_max": 22.190133990331855,
    "reward_min": -2.1825729150353292,
    "reward_std": 4.983496953349049,
    "timesteps": 553752891,
    "learntime": 0.27870642906054854,
    "sampletime": 8.943726382218301,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1565,
    "reward_mean": 16.764645486716176,
    "reward_max": 23.183708478313445,
    "reward_min": -1.6784274720606256,
    "reward_std": 4.423576408762222,
    "timesteps": 554109330,
    "learntime": 0.24400724121369421,
    "sampletime": 8.983431970933452,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1566,
    "reward_mean": 17.268184352141695,
    "reward_max": 21.567706360051297,
    "reward_min": -0.010900710130955874,
    "reward_std": 3.9901815981679483,
    "timesteps": 554467569,
    "learntime": 0.2828086849767715,
    "sampletime": 8.86190577200614,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1567,
    "reward_mean": 16.998436668772108,
    "reward_max": 21.753931538318284,
    "reward_min": -2.451673875816839,
    "reward_std": 4.193080129797037,
    "timesteps": 554824767,
    "learntime": 0.2556601269170642,
    "sampletime": 8.875378092983738,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1568,
    "reward_mean": 17.081139369554357,
    "reward_max": 22.150008872066703,
    "reward_min": -0.7049513733751779,
    "reward_std": 4.062367516442549,
    "timesteps": 555183939,
    "learntime": 0.28392383898608387,
    "sampletime": 8.942477593198419,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1569,
    "reward_mean": 18.16142223808277,
    "reward_max": 21.879497656941464,
    "reward_min": 6.595349198410102,
    "reward_std": 3.278195861857243,
    "timesteps": 555542625,
    "learntime": 0.24027528194710612,
    "sampletime": 8.970773494802415,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1570,
    "reward_mean": 17.352319302751294,
    "reward_max": 20.892665357582953,
    "reward_min": 6.960805311784937,
    "reward_std": 3.6491564779981656,
    "timesteps": 555901101,
    "learntime": 0.2885139109566808,
    "sampletime": 8.900671934010461,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1571,
    "reward_mean": 16.88161342520594,
    "reward_max": 21.988171948139392,
    "reward_min": -0.06476117108391738,
    "reward_std": 4.563538416154863,
    "timesteps": 556258191,
    "learntime": 0.24090152909047902,
    "sampletime": 8.883214105851948,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1572,
    "reward_mean": 18.477916351392796,
    "reward_max": 21.283053841046755,
    "reward_min": 6.05424342454044,
    "reward_std": 3.3522144606054924,
    "timesteps": 556616880,
    "learntime": 0.30464832205325365,
    "sampletime": 8.754509694874287,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1573,
    "reward_mean": 18.362394840551055,
    "reward_max": 21.462513280849002,
    "reward_min": 8.061909090011433,
    "reward_std": 3.0379094271481417,
    "timesteps": 556976187,
    "learntime": 0.2408141850028187,
    "sampletime": 8.796188339823857,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1574,
    "reward_mean": 18.121433044520685,
    "reward_max": 22.536035864333936,
    "reward_min": -1.2518919546608798,
    "reward_std": 4.152392233028628,
    "timesteps": 557335506,
    "learntime": 0.30888309492729604,
    "sampletime": 8.785713637014851,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1575,
    "reward_mean": 17.263385651918185,
    "reward_max": 22.88656606865609,
    "reward_min": -1.2628634523910771,
    "reward_std": 4.995030803967733,
    "timesteps": 557693052,
    "learntime": 0.24219493800774217,
    "sampletime": 8.905811744974926,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1576,
    "reward_mean": 18.212357784148615,
    "reward_max": 22.69493735656013,
    "reward_min": 0.7741505089709814,
    "reward_std": 4.173733406962576,
    "timesteps": 558050235,
    "learntime": 0.2956356049980968,
    "sampletime": 8.823481137864292,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1577,
    "reward_mean": 19.30650311334766,
    "reward_max": 22.46775995006883,
    "reward_min": 7.459905313913507,
    "reward_std": 2.660401647873944,
    "timesteps": 558410601,
    "learntime": 0.2387895118445158,
    "sampletime": 8.934980033896863,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1578,
    "reward_mean": 18.568266042653928,
    "reward_max": 22.852969168523686,
    "reward_min": -1.2352625677700777,
    "reward_std": 4.755682486979185,
    "timesteps": 558768858,
    "learntime": 0.281070931116119,
    "sampletime": 8.95455323299393,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1579,
    "reward_mean": 18.00098687609522,
    "reward_max": 23.526488356460256,
    "reward_min": 7.673379876745455,
    "reward_std": 4.444142273946903,
    "timesteps": 559125708,
    "learntime": 0.253779866034165,
    "sampletime": 9.016948817996308,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1580,
    "reward_mean": 18.77380003858248,
    "reward_max": 23.30567075426436,
    "reward_min": -0.8577104635205136,
    "reward_std": 5.450192914046678,
    "timesteps": 559483521,
    "learntime": 0.30054034502245486,
    "sampletime": 8.965008990140632,
    "best_max_mean": 17.007988785544654,
    "best_max": 24.106941965833713
  },
  {
    "gen": 1581,
    "reward_mean": 19.733909582928945,
    "reward_max": 24.112096746067632,
    "reward_min": 1.0098607909696347,
    "reward_std": 4.192717852866346,
    "timesteps": 559841886,
    "learntime": 0.24362802901305258,
    "sampletime": 8.836325286189094,
    "best_max_mean": 19.733909582928945,
    "best_max": 24.112096746067632
  },
  {
    "gen": 1582,
    "reward_mean": 15.97710359988804,
    "reward_max": 22.723727826216024,
    "reward_min": -4.694656720928221,
    "reward_std": 6.253269831112287,
    "timesteps": 560197260,
    "learntime": 0.2945935670286417,
    "sampletime": 8.998458630172536,
    "best_max_mean": 19.733909582928945,
    "best_max": 24.112096746067632
  },
  {
    "gen": 1583,
    "reward_mean": 17.195440495521822,
    "reward_max": 24.534424392026708,
    "reward_min": -0.5755269459985018,
    "reward_std": 6.17682980314602,
    "timesteps": 560553438,
    "learntime": 0.25197753007523715,
    "sampletime": 8.917568568140268,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1584,
    "reward_mean": 16.18755717983493,
    "reward_max": 23.644194312896918,
    "reward_min": -23.280504273095474,
    "reward_std": 7.879899797756705,
    "timesteps": 560907603,
    "learntime": 0.2764492998830974,
    "sampletime": 8.875579829094931,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1585,
    "reward_mean": 17.43475124726513,
    "reward_max": 23.75943376062522,
    "reward_min": -10.859313750371458,
    "reward_std": 6.856205253341742,
    "timesteps": 561262710,
    "learntime": 0.23674303898587823,
    "sampletime": 8.764150460949168,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1586,
    "reward_mean": 18.132412472699507,
    "reward_max": 24.29743057551482,
    "reward_min": 8.733072078843234,
    "reward_std": 5.076702093300457,
    "timesteps": 561618072,
    "learntime": 0.2982071640435606,
    "sampletime": 8.933561073150486,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1587,
    "reward_mean": 19.307112826779722,
    "reward_max": 24.51367637628484,
    "reward_min": 1.238056343671559,
    "reward_std": 4.683532549168481,
    "timesteps": 561975279,
    "learntime": 0.23927257815375924,
    "sampletime": 9.009469995973632,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1588,
    "reward_mean": 18.236936942921496,
    "reward_max": 23.552776588776116,
    "reward_min": 0.41610420927948527,
    "reward_std": 5.850530125618727,
    "timesteps": 562331994,
    "learntime": 0.28226019511930645,
    "sampletime": 8.837583345128223,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1589,
    "reward_mean": 15.859202266540123,
    "reward_max": 23.907134243422963,
    "reward_min": -21.84342266622028,
    "reward_std": 7.666937681167578,
    "timesteps": 562684437,
    "learntime": 0.24558814987540245,
    "sampletime": 8.898029778152704,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1590,
    "reward_mean": 14.889524674057956,
    "reward_max": 23.7347130192599,
    "reward_min": -7.219106858971323,
    "reward_std": 7.972002779956698,
    "timesteps": 563033931,
    "learntime": 0.29746486991643906,
    "sampletime": 8.721470493124798,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1591,
    "reward_mean": 17.170946415928967,
    "reward_max": 23.992127070161096,
    "reward_min": -10.064179126723586,
    "reward_std": 7.296207040513842,
    "timesteps": 563389476,
    "learntime": 0.24366657994687557,
    "sampletime": 8.83840806200169,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1592,
    "reward_mean": 17.074870505534356,
    "reward_max": 24.320533152345103,
    "reward_min": -8.950959841078708,
    "reward_std": 7.14709605843692,
    "timesteps": 563744241,
    "learntime": 0.25051197805441916,
    "sampletime": 8.78122584708035,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1593,
    "reward_mean": 19.345584249659147,
    "reward_max": 23.856925402796175,
    "reward_min": 2.6321678950787573,
    "reward_std": 4.15907377542382,
    "timesteps": 564102678,
    "learntime": 0.24216288793832064,
    "sampletime": 8.945299444021657,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1594,
    "reward_mean": 17.443897629605523,
    "reward_max": 23.5340154173627,
    "reward_min": -1.3823437397497702,
    "reward_std": 6.524905083379756,
    "timesteps": 564456417,
    "learntime": 0.2889441470615566,
    "sampletime": 8.945190137950704,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1595,
    "reward_mean": 19.375707650760805,
    "reward_max": 24.396482499580916,
    "reward_min": 1.9908509452749639,
    "reward_std": 4.7919826265988466,
    "timesteps": 564812922,
    "learntime": 0.24897346808575094,
    "sampletime": 8.899596167961136,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1596,
    "reward_mean": 14.910808487835052,
    "reward_max": 23.714673422763813,
    "reward_min": -22.810096744586193,
    "reward_std": 8.701115278028126,
    "timesteps": 565164819,
    "learntime": 0.28992912685498595,
    "sampletime": 9.023852262180299,
    "best_max_mean": 17.195440495521822,
    "best_max": 24.534424392026708
  },
  {
    "gen": 1597,
    "reward_mean": 13.642681692213058,
    "reward_max": 25.03806481092599,
    "reward_min": -12.158276233506369,
    "reward_std": 10.084259512752343,
    "timesteps": 565512429,
    "learntime": 0.2385645790491253,
    "sampletime": 8.687426388030872,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1598,
    "reward_mean": 13.98221727560836,
    "reward_max": 24.871405508651424,
    "reward_min": -19.810379216514505,
    "reward_std": 10.325126390288903,
    "timesteps": 565862415,
    "learntime": 0.2976406901143491,
    "sampletime": 8.77441768697463,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1599,
    "reward_mean": 13.399626820669823,
    "reward_max": 24.09825791755804,
    "reward_min": -20.75620080403292,
    "reward_std": 9.905683267567495,
    "timesteps": 566208165,
    "learntime": 0.24762397282756865,
    "sampletime": 8.632471336983144,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1600,
    "reward_mean": 9.526398722048214,
    "reward_max": 23.93722127100002,
    "reward_min": -29.463228271875504,
    "reward_std": 11.210046514664564,
    "timesteps": 566554188,
    "learntime": 0.30334376101382077,
    "sampletime": 8.710487249074504,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1601,
    "reward_mean": 16.910758117331056,
    "reward_max": 24.34910291880651,
    "reward_min": -19.48869301507137,
    "reward_std": 7.686583830409563,
    "timesteps": 566907882,
    "learntime": 0.11641813698224723,
    "sampletime": 8.781463637016714,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1602,
    "reward_mean": 13.19814202579486,
    "reward_max": 23.391031582800977,
    "reward_min": -22.51584650302362,
    "reward_std": 9.49700746990534,
    "timesteps": 567257154,
    "learntime": 0.29603565600700676,
    "sampletime": 8.850622934987769,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1603,
    "reward_mean": 16.303656899253262,
    "reward_max": 24.00019393457014,
    "reward_min": -10.298840120720516,
    "reward_std": 7.508169418440398,
    "timesteps": 567610443,
    "learntime": 0.23746171710081398,
    "sampletime": 8.832470843801275,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1604,
    "reward_mean": 16.960139893165078,
    "reward_max": 24.084211759417393,
    "reward_min": -17.22833600660346,
    "reward_std": 7.914031529467972,
    "timesteps": 567963498,
    "learntime": 0.289623964112252,
    "sampletime": 8.776260395068675,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1605,
    "reward_mean": 12.92746850279881,
    "reward_max": 23.82495742892338,
    "reward_min": -16.84352253013155,
    "reward_std": 9.568209394382178,
    "timesteps": 568309773,
    "learntime": 0.2316399731207639,
    "sampletime": 8.730280798859894,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1606,
    "reward_mean": 14.797312584572122,
    "reward_max": 23.54013963680094,
    "reward_min": -7.944867372609838,
    "reward_std": 7.595571042656177,
    "timesteps": 568658457,
    "learntime": 0.28234720905311406,
    "sampletime": 8.80550422007218,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1607,
    "reward_mean": 15.881856035462413,
    "reward_max": 24.425649120067558,
    "reward_min": -10.299470050528543,
    "reward_std": 7.275326992034993,
    "timesteps": 569010681,
    "learntime": 0.24721251497976482,
    "sampletime": 8.801300324965268,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1608,
    "reward_mean": 18.441116218928894,
    "reward_max": 23.301559971800692,
    "reward_min": 2.2806547301906064,
    "reward_std": 5.108915744178957,
    "timesteps": 569368731,
    "learntime": 0.29877052991651,
    "sampletime": 8.810859781922773,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1609,
    "reward_mean": 17.938556509512352,
    "reward_max": 23.805696044455875,
    "reward_min": 8.694661281442897,
    "reward_std": 4.687722257584147,
    "timesteps": 569726655,
    "learntime": 0.24173744698055089,
    "sampletime": 8.76185339782387,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1610,
    "reward_mean": 17.59520853556191,
    "reward_max": 22.788509739048695,
    "reward_min": -0.6855821500419446,
    "reward_std": 5.073340391441755,
    "timesteps": 570082530,
    "learntime": 0.28503617993555963,
    "sampletime": 9.125019490951672,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1611,
    "reward_mean": 18.686038413942747,
    "reward_max": 23.189711338106648,
    "reward_min": 0.5260624823470853,
    "reward_std": 4.699072491005344,
    "timesteps": 570439389,
    "learntime": 0.25831313198432326,
    "sampletime": 8.882865374907851,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1612,
    "reward_mean": 16.24716435289995,
    "reward_max": 22.776324251962997,
    "reward_min": -9.87030907202456,
    "reward_std": 6.7979647624582995,
    "timesteps": 570791250,
    "learntime": 0.2829018069896847,
    "sampletime": 8.684844288975,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1613,
    "reward_mean": 19.24998196780212,
    "reward_max": 23.205508947478265,
    "reward_min": 8.312242480914524,
    "reward_std": 3.5427175590919404,
    "timesteps": 571149825,
    "learntime": 0.24316548486240208,
    "sampletime": 8.878313009161502,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1614,
    "reward_mean": 15.759515163256546,
    "reward_max": 22.9156839014516,
    "reward_min": -1.9651698874788313,
    "reward_std": 6.703045860055598,
    "timesteps": 571501353,
    "learntime": 0.2828468498773873,
    "sampletime": 8.775937892030925,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1615,
    "reward_mean": 18.049560433164125,
    "reward_max": 22.673439246083774,
    "reward_min": 5.973033783102323,
    "reward_std": 4.23357504717193,
    "timesteps": 571859313,
    "learntime": 0.24454719084315002,
    "sampletime": 8.934203305048868,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1616,
    "reward_mean": 18.523408615574816,
    "reward_max": 22.350451913873915,
    "reward_min": 8.51515212965508,
    "reward_std": 3.867121062128241,
    "timesteps": 572217438,
    "learntime": 0.292459286050871,
    "sampletime": 8.994268133072183,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1617,
    "reward_mean": 14.98655608198796,
    "reward_max": 22.53205404251419,
    "reward_min": -2.500202040741871,
    "reward_std": 6.368193159125489,
    "timesteps": 572568342,
    "learntime": 0.24473922792822123,
    "sampletime": 8.839071020949632,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1618,
    "reward_mean": 18.614749027641913,
    "reward_max": 22.013431979664308,
    "reward_min": 7.365209914495196,
    "reward_std": 2.4760626388524565,
    "timesteps": 572928231,
    "learntime": 0.3027650888543576,
    "sampletime": 8.947511938167736,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1619,
    "reward_mean": 16.860411207117018,
    "reward_max": 23.069395073308524,
    "reward_min": 6.870876135586794,
    "reward_std": 4.0667960495623685,
    "timesteps": 573285654,
    "learntime": 0.2420145880896598,
    "sampletime": 8.971555263036862,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1620,
    "reward_mean": 15.572494311373106,
    "reward_max": 21.037855664649125,
    "reward_min": -1.9673749256568636,
    "reward_std": 4.821506309357842,
    "timesteps": 573643050,
    "learntime": 0.2466324099805206,
    "sampletime": 8.880497141974047,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1621,
    "reward_mean": 15.718655027957798,
    "reward_max": 20.869762563605256,
    "reward_min": -5.112654732836585,
    "reward_std": 5.21167677287242,
    "timesteps": 574000716,
    "learntime": 0.27044634986668825,
    "sampletime": 8.841460824944079,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1622,
    "reward_mean": 15.380854969077859,
    "reward_max": 20.190082856635637,
    "reward_min": 4.046778682026672,
    "reward_std": 4.201621862499355,
    "timesteps": 574357434,
    "learntime": 0.25296559487469494,
    "sampletime": 8.853273120010272,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1623,
    "reward_mean": 15.369556066571514,
    "reward_max": 20.703394739726328,
    "reward_min": 5.4244806807731605,
    "reward_std": 3.183518420482225,
    "timesteps": 574715994,
    "learntime": 0.2566437020432204,
    "sampletime": 8.886582233943045,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1624,
    "reward_mean": 15.117699804320157,
    "reward_max": 20.605435473107118,
    "reward_min": -3.0175788847651974,
    "reward_std": 4.7702482025374175,
    "timesteps": 575072667,
    "learntime": 0.2508295220322907,
    "sampletime": 9.033074381994084,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1625,
    "reward_mean": 15.772332510804725,
    "reward_max": 20.804744653812975,
    "reward_min": 5.310199005091843,
    "reward_std": 2.6370919853729804,
    "timesteps": 575432160,
    "learntime": 0.24164391681551933,
    "sampletime": 8.886757761007175,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1626,
    "reward_mean": 15.23067501896053,
    "reward_max": 20.888061257610165,
    "reward_min": 4.512012081026722,
    "reward_std": 2.688588705920145,
    "timesteps": 575791785,
    "learntime": 0.24998554401099682,
    "sampletime": 9.013199387816712,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1627,
    "reward_mean": 14.738725911920824,
    "reward_max": 18.180618911173738,
    "reward_min": 6.394101414974125,
    "reward_std": 2.352861840315372,
    "timesteps": 576152040,
    "learntime": 0.24285421893000603,
    "sampletime": 8.954479022882879,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1628,
    "reward_mean": 14.054763385134958,
    "reward_max": 19.7512018906771,
    "reward_min": 3.009626770236842,
    "reward_std": 4.295786027207729,
    "timesteps": 576509586,
    "learntime": 0.2633651129435748,
    "sampletime": 8.889766711974517,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1629,
    "reward_mean": 14.753829840988018,
    "reward_max": 18.74024888235285,
    "reward_min": 2.997204853790914,
    "reward_std": 3.220997306030584,
    "timesteps": 576868263,
    "learntime": 0.24206849094480276,
    "sampletime": 8.879559570923448,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1630,
    "reward_mean": 15.951600641560747,
    "reward_max": 20.076078166268413,
    "reward_min": 5.860805106851984,
    "reward_std": 2.8113574105120365,
    "timesteps": 577227879,
    "learntime": 0.23837298015132546,
    "sampletime": 8.92772329901345,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1631,
    "reward_mean": 14.860273873456213,
    "reward_max": 19.905838033999313,
    "reward_min": 2.17272714869768,
    "reward_std": 3.551352082103008,
    "timesteps": 577586415,
    "learntime": 0.24051315896213055,
    "sampletime": 9.050549937877804,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1632,
    "reward_mean": 15.404585819261559,
    "reward_max": 21.0004908868649,
    "reward_min": 5.280673934706781,
    "reward_std": 3.048249122515912,
    "timesteps": 577944828,
    "learntime": 0.25005002110265195,
    "sampletime": 8.934333548881114,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1633,
    "reward_mean": 15.627511067824994,
    "reward_max": 20.433393910123307,
    "reward_min": 11.538589247269554,
    "reward_std": 1.908828474498487,
    "timesteps": 578305548,
    "learntime": 0.2455437460448593,
    "sampletime": 8.905311131151393,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1634,
    "reward_mean": 14.542111647829769,
    "reward_max": 17.941063363676548,
    "reward_min": -5.064688448610742,
    "reward_std": 4.171960537224623,
    "timesteps": 578662857,
    "learntime": 0.2519631620962173,
    "sampletime": 8.844437944935635,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1635,
    "reward_mean": 15.784638102436098,
    "reward_max": 20.086805685911603,
    "reward_min": -2.733398561616379,
    "reward_std": 3.58367118412279,
    "timesteps": 579021306,
    "learntime": 0.24204630590975285,
    "sampletime": 8.890677741961554,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1636,
    "reward_mean": 16.16619439566565,
    "reward_max": 21.256841824643992,
    "reward_min": 3.209982248781168,
    "reward_std": 3.8212979469214603,
    "timesteps": 579379821,
    "learntime": 0.24822775390930474,
    "sampletime": 8.955516312969849,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1637,
    "reward_mean": 15.684433229306267,
    "reward_max": 20.400176647140384,
    "reward_min": -0.22204184411547048,
    "reward_std": 4.437098204051972,
    "timesteps": 579737349,
    "learntime": 0.24591665202751756,
    "sampletime": 9.011220746906474,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1638,
    "reward_mean": 16.495381957399886,
    "reward_max": 20.147425130447086,
    "reward_min": 6.304337714750238,
    "reward_std": 3.1833475548893313,
    "timesteps": 580095759,
    "learntime": 0.24531283788383007,
    "sampletime": 8.89594501000829,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1639,
    "reward_mean": 17.17304981400865,
    "reward_max": 20.792404877917956,
    "reward_min": 8.39850137046434,
    "reward_std": 2.8847649720965567,
    "timesteps": 580454532,
    "learntime": 0.2473007421940565,
    "sampletime": 8.927706490969285,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1640,
    "reward_mean": 15.941226903720448,
    "reward_max": 21.020166374139734,
    "reward_min": 6.001211080403831,
    "reward_std": 4.695590847292186,
    "timesteps": 580812843,
    "learntime": 0.23697297694161534,
    "sampletime": 9.00851122615859,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1641,
    "reward_mean": 17.17477226645578,
    "reward_max": 21.13229951563036,
    "reward_min": 6.655099831422735,
    "reward_std": 4.38831065495918,
    "timesteps": 581169810,
    "learntime": 0.2480802338104695,
    "sampletime": 9.011747888987884,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1642,
    "reward_mean": 17.554013196585334,
    "reward_max": 22.051562660804134,
    "reward_min": 6.735520483952393,
    "reward_std": 4.2261446869823285,
    "timesteps": 581526810,
    "learntime": 0.24685637396760285,
    "sampletime": 8.908436940051615,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1643,
    "reward_mean": 17.040347488571513,
    "reward_max": 22.231948560414217,
    "reward_min": -3.9084381944902122,
    "reward_std": 5.339469397952968,
    "timesteps": 581881869,
    "learntime": 0.2408940561581403,
    "sampletime": 8.775993532966822,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1644,
    "reward_mean": 16.340400313882313,
    "reward_max": 22.904306474141777,
    "reward_min": -1.8089392604800223,
    "reward_std": 6.893989067963978,
    "timesteps": 582235563,
    "learntime": 0.2512506260536611,
    "sampletime": 8.863807269837707,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1645,
    "reward_mean": 17.729078648145983,
    "reward_max": 22.88543357347335,
    "reward_min": 1.215278126784444,
    "reward_std": 4.847075740283719,
    "timesteps": 582594447,
    "learntime": 0.2540052100084722,
    "sampletime": 8.887497595045716,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1646,
    "reward_mean": 17.96332578314448,
    "reward_max": 23.027920195966896,
    "reward_min": 0.3920222970217812,
    "reward_std": 5.14774853572999,
    "timesteps": 582950622,
    "learntime": 0.23764219600707293,
    "sampletime": 8.891667306190357,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1647,
    "reward_mean": 18.094092412790683,
    "reward_max": 23.057482212323738,
    "reward_min": -6.516747892539975,
    "reward_std": 6.07154449900666,
    "timesteps": 583306320,
    "learntime": 0.24770251102745533,
    "sampletime": 8.944812156027183,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1648,
    "reward_mean": 17.421477273052822,
    "reward_max": 23.055998009488437,
    "reward_min": -0.5493603186173879,
    "reward_std": 5.846505990397731,
    "timesteps": 583662711,
    "learntime": 0.24649501196108758,
    "sampletime": 8.907167808851227,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1649,
    "reward_mean": 17.78683719564522,
    "reward_max": 23.111434414371615,
    "reward_min": 1.6318804585113817,
    "reward_std": 5.768267913532603,
    "timesteps": 584017737,
    "learntime": 0.24447666993364692,
    "sampletime": 8.76770212710835,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1650,
    "reward_mean": 18.20616410853208,
    "reward_max": 23.602935845907208,
    "reward_min": -0.4562922212309388,
    "reward_std": 6.0885282626599455,
    "timesteps": 584373258,
    "learntime": 0.2599872329737991,
    "sampletime": 8.885754990158603,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1651,
    "reward_mean": 16.247026802778915,
    "reward_max": 23.82874277260888,
    "reward_min": -10.853972567136003,
    "reward_std": 7.399011468221091,
    "timesteps": 584726865,
    "learntime": 0.24253153684549034,
    "sampletime": 8.968781236093491,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1652,
    "reward_mean": 16.28322348393521,
    "reward_max": 23.418064211131874,
    "reward_min": 0.7118948132476998,
    "reward_std": 6.773508483295721,
    "timesteps": 585080232,
    "learntime": 0.25378592498600483,
    "sampletime": 8.81173136504367,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1653,
    "reward_mean": 16.289266618383365,
    "reward_max": 23.262032158595193,
    "reward_min": -11.394007094267929,
    "reward_std": 7.368012442830866,
    "timesteps": 585433251,
    "learntime": 0.26158024300821126,
    "sampletime": 8.80714179808274,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1654,
    "reward_mean": 16.35187275908042,
    "reward_max": 23.2619296030995,
    "reward_min": -5.566320313514254,
    "reward_std": 7.426884688802306,
    "timesteps": 585788025,
    "learntime": 0.24862538208253682,
    "sampletime": 8.805162483127788,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1655,
    "reward_mean": 15.275678501263517,
    "reward_max": 24.624980236545635,
    "reward_min": -7.9030067407357985,
    "reward_std": 7.433773512498333,
    "timesteps": 586141872,
    "learntime": 0.25555757991969585,
    "sampletime": 8.814673949964345,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1656,
    "reward_mean": 16.808627910529648,
    "reward_max": 23.6103992480914,
    "reward_min": 1.9904436609358507,
    "reward_std": 5.458013148611183,
    "timesteps": 586497633,
    "learntime": 0.24125257111154497,
    "sampletime": 8.945109352003783,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1657,
    "reward_mean": 13.907370470844523,
    "reward_max": 24.137684647247866,
    "reward_min": -10.982006799341464,
    "reward_std": 7.895384969796703,
    "timesteps": 586849215,
    "learntime": 0.25066191400401294,
    "sampletime": 8.824342085048556,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1658,
    "reward_mean": 14.096387666332168,
    "reward_max": 24.11867076642617,
    "reward_min": -2.9036994233628692,
    "reward_std": 7.817584379423049,
    "timesteps": 587200758,
    "learntime": 0.2820790410041809,
    "sampletime": 8.84152967017144,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1659,
    "reward_mean": 17.005227706429984,
    "reward_max": 23.959098913766663,
    "reward_min": -8.127766001860222,
    "reward_std": 6.9236687813880975,
    "timesteps": 587554575,
    "learntime": 0.28978018718771636,
    "sampletime": 9.002155235037208,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1660,
    "reward_mean": 13.933149622563427,
    "reward_max": 23.30251554100224,
    "reward_min": -10.944490891962424,
    "reward_std": 8.400665145129121,
    "timesteps": 587906925,
    "learntime": 0.23988362890668213,
    "sampletime": 8.934037999017164,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1661,
    "reward_mean": 16.720369204002182,
    "reward_max": 23.066265354467426,
    "reward_min": -0.9151463921774518,
    "reward_std": 6.55702278856402,
    "timesteps": 588259338,
    "learntime": 0.2515343311242759,
    "sampletime": 8.890710753155872,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1662,
    "reward_mean": 15.316734948877944,
    "reward_max": 23.39839152521583,
    "reward_min": -1.3504097188230288,
    "reward_std": 7.433161709184686,
    "timesteps": 588610152,
    "learntime": 0.2982915500178933,
    "sampletime": 8.749165412038565,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1663,
    "reward_mean": 17.579393845482343,
    "reward_max": 23.78703387117194,
    "reward_min": 1.384800233849966,
    "reward_std": 5.981956545083993,
    "timesteps": 588967464,
    "learntime": 0.2468765820376575,
    "sampletime": 8.884040634147823,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1664,
    "reward_mean": 16.84501284890049,
    "reward_max": 24.007897511999484,
    "reward_min": -6.634626522175199,
    "reward_std": 7.011033682807241,
    "timesteps": 589319781,
    "learntime": 0.3007332067936659,
    "sampletime": 9.004617478931323,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1665,
    "reward_mean": 14.448580982490746,
    "reward_max": 23.892204588532238,
    "reward_min": -18.691033768001944,
    "reward_std": 8.456255971334341,
    "timesteps": 589672911,
    "learntime": 0.24473508796654642,
    "sampletime": 8.818093220936134,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1666,
    "reward_mean": 17.156174195433316,
    "reward_max": 23.465905325375683,
    "reward_min": -1.3046514519660528,
    "reward_std": 7.061776829463153,
    "timesteps": 590028417,
    "learntime": 0.31875825906172395,
    "sampletime": 8.84390956396237,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1667,
    "reward_mean": 13.933489400693936,
    "reward_max": 23.084362242060397,
    "reward_min": -11.11443709164406,
    "reward_std": 7.9023283172220635,
    "timesteps": 590377905,
    "learntime": 0.25678084208630025,
    "sampletime": 9.042027689982206,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1668,
    "reward_mean": 18.070954927204085,
    "reward_max": 23.66472268904644,
    "reward_min": 1.9985405308772968,
    "reward_std": 6.342732930091553,
    "timesteps": 590734551,
    "learntime": 0.2965991389937699,
    "sampletime": 9.019915712997317,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1669,
    "reward_mean": 15.212385466232806,
    "reward_max": 23.651604947281267,
    "reward_min": -9.194458190986715,
    "reward_std": 7.745469782692652,
    "timesteps": 591085650,
    "learntime": 0.24932982702739537,
    "sampletime": 8.745374761056155,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1670,
    "reward_mean": 15.387181295296301,
    "reward_max": 23.625938366893955,
    "reward_min": -11.977604794880433,
    "reward_std": 8.590510077817006,
    "timesteps": 591437163,
    "learntime": 0.3046218070667237,
    "sampletime": 8.652570780133829,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1671,
    "reward_mean": 17.84993484422494,
    "reward_max": 23.57170719949697,
    "reward_min": 1.9540357078764197,
    "reward_std": 5.506436736048706,
    "timesteps": 591794220,
    "learntime": 0.25027533201500773,
    "sampletime": 8.928853658027947,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1672,
    "reward_mean": 18.00073592534175,
    "reward_max": 24.05744842646262,
    "reward_min": -1.468606198170385,
    "reward_std": 5.509667769115501,
    "timesteps": 592151451,
    "learntime": 0.29193201195448637,
    "sampletime": 9.079813539981842,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1673,
    "reward_mean": 16.009418648474963,
    "reward_max": 23.184232071346027,
    "reward_min": -7.5298911340668715,
    "reward_std": 6.604758347978242,
    "timesteps": 592505424,
    "learntime": 0.2554323759395629,
    "sampletime": 8.852693296037614,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1674,
    "reward_mean": 17.357805203509837,
    "reward_max": 23.436628832185466,
    "reward_min": 1.5394618883479736,
    "reward_std": 5.610421596165068,
    "timesteps": 592863111,
    "learntime": 0.29194419411942363,
    "sampletime": 8.86652453104034,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1675,
    "reward_mean": 16.92058879785744,
    "reward_max": 22.194884918259707,
    "reward_min": -1.2825189635270546,
    "reward_std": 6.156816999533007,
    "timesteps": 593218002,
    "learntime": 0.2527640040498227,
    "sampletime": 8.98716067802161,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1676,
    "reward_mean": 17.217948616077226,
    "reward_max": 23.066553131959424,
    "reward_min": -10.026544388707293,
    "reward_std": 6.52124429624646,
    "timesteps": 593573586,
    "learntime": 0.28771066199988127,
    "sampletime": 8.944287220016122,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1677,
    "reward_mean": 18.394937025868508,
    "reward_max": 22.67131322799391,
    "reward_min": 0.15873247191705112,
    "reward_std": 4.909061609572385,
    "timesteps": 593930613,
    "learntime": 0.24662096705287695,
    "sampletime": 8.852198716020212,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1678,
    "reward_mean": 17.05580998309098,
    "reward_max": 22.161743454973802,
    "reward_min": -1.8292445995647328,
    "reward_std": 5.705458037853916,
    "timesteps": 594284418,
    "learntime": 0.3097384839784354,
    "sampletime": 8.83270193496719,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1679,
    "reward_mean": 18.725467302412177,
    "reward_max": 23.258419698534343,
    "reward_min": 8.339855384520803,
    "reward_std": 4.2806030229678536,
    "timesteps": 594640419,
    "learntime": 0.2449746821075678,
    "sampletime": 8.955982910934836,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1680,
    "reward_mean": 18.16121207612478,
    "reward_max": 22.620049300896365,
    "reward_min": -0.3020517125365875,
    "reward_std": 4.760610984800212,
    "timesteps": 594997767,
    "learntime": 0.29654284892603755,
    "sampletime": 8.916470597032458,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1681,
    "reward_mean": 15.293853655668702,
    "reward_max": 22.312583733235382,
    "reward_min": -10.357291251731418,
    "reward_std": 7.204665362469107,
    "timesteps": 595350837,
    "learntime": 0.24455098691396415,
    "sampletime": 8.85848408495076,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1682,
    "reward_mean": 15.69205186532361,
    "reward_max": 22.182964204768783,
    "reward_min": -2.185895766992352,
    "reward_std": 6.558574530351109,
    "timesteps": 595704954,
    "learntime": 0.2978789380285889,
    "sampletime": 8.843257104046643,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1683,
    "reward_mean": 18.270401270474046,
    "reward_max": 22.236395914601445,
    "reward_min": -0.6540655129515062,
    "reward_std": 4.249307923411638,
    "timesteps": 596062251,
    "learntime": 0.24133079801686108,
    "sampletime": 8.988729681121185,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1684,
    "reward_mean": 18.390842680008255,
    "reward_max": 21.68736630558851,
    "reward_min": -2.2330565405268743,
    "reward_std": 4.217315219155554,
    "timesteps": 596420625,
    "learntime": 0.3003386971540749,
    "sampletime": 8.864328228868544,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1685,
    "reward_mean": 14.782927981651621,
    "reward_max": 20.994036638837617,
    "reward_min": -9.705177123775181,
    "reward_std": 6.820666152059442,
    "timesteps": 596775018,
    "learntime": 0.25365628697909415,
    "sampletime": 8.998577676014975,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1686,
    "reward_mean": 16.403547166575272,
    "reward_max": 21.58771047850358,
    "reward_min": 1.26322088950029,
    "reward_std": 4.9202368101450915,
    "timesteps": 597130440,
    "learntime": 0.28646198101341724,
    "sampletime": 8.90302961692214,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1687,
    "reward_mean": 15.18961590342812,
    "reward_max": 20.485312418662943,
    "reward_min": -12.07985703445351,
    "reward_std": 6.400247904506032,
    "timesteps": 597484134,
    "learntime": 0.2630055060144514,
    "sampletime": 8.927599382819608,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1688,
    "reward_mean": 13.504186945692684,
    "reward_max": 19.72866737055345,
    "reward_min": -1.4068842717926204,
    "reward_std": 5.469441298703375,
    "timesteps": 597837273,
    "learntime": 0.304941319860518,
    "sampletime": 8.854617398930714,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1689,
    "reward_mean": 14.1468682155264,
    "reward_max": 19.929216675263078,
    "reward_min": -11.167874439931692,
    "reward_std": 6.19726698779731,
    "timesteps": 598191000,
    "learntime": 0.2451107248198241,
    "sampletime": 8.846619348041713,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1690,
    "reward_mean": 15.035825745088914,
    "reward_max": 19.11457318697339,
    "reward_min": -4.790804257313021,
    "reward_std": 5.194532861069142,
    "timesteps": 598547067,
    "learntime": 0.2998801930807531,
    "sampletime": 9.117479074047878,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1691,
    "reward_mean": 15.107983083274897,
    "reward_max": 19.586428697778366,
    "reward_min": -2.9585513638854617,
    "reward_std": 5.477589652534871,
    "timesteps": 598902990,
    "learntime": 0.24486206797882915,
    "sampletime": 8.786182356067002,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1692,
    "reward_mean": 13.715482723971558,
    "reward_max": 18.591402478895827,
    "reward_min": 2.778631777356267,
    "reward_std": 4.517853155847109,
    "timesteps": 599258928,
    "learntime": 0.24308840814046562,
    "sampletime": 8.929657449014485,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1693,
    "reward_mean": 13.510386568488638,
    "reward_max": 18.942500629713727,
    "reward_min": -4.4802830656073285,
    "reward_std": 5.7414619758392025,
    "timesteps": 599611995,
    "learntime": 0.25043923198245466,
    "sampletime": 8.890078695025295,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1694,
    "reward_mean": 16.435902549232765,
    "reward_max": 18.169737037638143,
    "reward_min": 12.477164093267424,
    "reward_std": 1.095806274027581,
    "timesteps": 599972715,
    "learntime": 0.2503137169405818,
    "sampletime": 9.033577722962946,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1695,
    "reward_mean": 14.07572290344099,
    "reward_max": 20.05204913535183,
    "reward_min": -4.952864339903255,
    "reward_std": 5.369538697621548,
    "timesteps": 600329640,
    "learntime": 0.2517185958568007,
    "sampletime": 8.994418344926089,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1696,
    "reward_mean": 13.694998214792268,
    "reward_max": 18.03119843123326,
    "reward_min": 3.5344515574520914,
    "reward_std": 4.415517093668852,
    "timesteps": 600686148,
    "learntime": 0.2523047961294651,
    "sampletime": 9.010861040093005,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1697,
    "reward_mean": 14.45553067487371,
    "reward_max": 17.824315349003438,
    "reward_min": 3.7256005411230326,
    "reward_std": 3.6674811484724317,
    "timesteps": 601043697,
    "learntime": 0.23996350588276982,
    "sampletime": 9.187826995970681,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1698,
    "reward_mean": 10.434696986418565,
    "reward_max": 17.68229111210288,
    "reward_min": -12.120004155259172,
    "reward_std": 7.16177609629691,
    "timesteps": 601394040,
    "learntime": 0.24868171103298664,
    "sampletime": 8.907885435037315,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1699,
    "reward_mean": 13.236977338429478,
    "reward_max": 18.274184633208655,
    "reward_min": -8.313002796907147,
    "reward_std": 4.680135730553378,
    "timesteps": 601749951,
    "learntime": 0.25459463498555124,
    "sampletime": 8.967015764908865,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1700,
    "reward_mean": 11.595831126888104,
    "reward_max": 18.277833322726302,
    "reward_min": -5.684291305929509,
    "reward_std": 6.107483087720412,
    "timesteps": 602100090,
    "learntime": 0.2452050498686731,
    "sampletime": 8.81029408518225,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1701,
    "reward_mean": 10.968048071725793,
    "reward_max": 18.386318363348074,
    "reward_min": -5.314279895597517,
    "reward_std": 6.980102262496899,
    "timesteps": 602448996,
    "learntime": 0.24923373712226748,
    "sampletime": 8.84965294902213,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1702,
    "reward_mean": 7.588963028318729,
    "reward_max": 18.81987034715712,
    "reward_min": -25.281800685612712,
    "reward_std": 8.993497249287133,
    "timesteps": 602790612,
    "learntime": 0.2567703318782151,
    "sampletime": 8.619417668087408,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1703,
    "reward_mean": 8.653629946293432,
    "reward_max": 17.959854836406727,
    "reward_min": -14.60437670041045,
    "reward_std": 8.550993519380084,
    "timesteps": 603135255,
    "learntime": 0.2547332749236375,
    "sampletime": 8.776221927953884,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1704,
    "reward_mean": 9.649469318288734,
    "reward_max": 18.851363233436135,
    "reward_min": -14.497629071021402,
    "reward_std": 7.796207851048302,
    "timesteps": 603481761,
    "learntime": 0.2574516299646348,
    "sampletime": 8.743822599062696,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1705,
    "reward_mean": 9.750538391940534,
    "reward_max": 18.602227318035943,
    "reward_min": -13.07744809265503,
    "reward_std": 8.146478953741363,
    "timesteps": 603827190,
    "learntime": 0.23937834613025188,
    "sampletime": 8.75596180302091,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1706,
    "reward_mean": 10.799798517800538,
    "reward_max": 18.314587804390058,
    "reward_min": -26.82474341892433,
    "reward_std": 9.348923060334622,
    "timesteps": 604175430,
    "learntime": 0.2497479401063174,
    "sampletime": 8.628746049944311,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1707,
    "reward_mean": 8.580700200800987,
    "reward_max": 17.631556842232715,
    "reward_min": -23.536061166302353,
    "reward_std": 8.127309125907816,
    "timesteps": 604519779,
    "learntime": 0.25310719083063304,
    "sampletime": 8.722318759886548,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1708,
    "reward_mean": 7.594264124925472,
    "reward_max": 18.68341719826232,
    "reward_min": -22.935496646463772,
    "reward_std": 8.986244122319594,
    "timesteps": 604860309,
    "learntime": 0.249531403882429,
    "sampletime": 8.796269454993308,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1709,
    "reward_mean": 8.828487824981472,
    "reward_max": 18.851894902326453,
    "reward_min": -12.440420865224569,
    "reward_std": 8.267306900911507,
    "timesteps": 605202939,
    "learntime": 0.25144764385186136,
    "sampletime": 8.675736907869577,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1710,
    "reward_mean": 9.479121638731863,
    "reward_max": 19.248837828234006,
    "reward_min": -13.669711781284692,
    "reward_std": 9.191070831433084,
    "timesteps": 605547711,
    "learntime": 0.2545439079403877,
    "sampletime": 8.664678402012214,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1711,
    "reward_mean": 6.605392496081935,
    "reward_max": 19.16346757436662,
    "reward_min": -14.436066641651259,
    "reward_std": 8.995462973472833,
    "timesteps": 605887017,
    "learntime": 0.24761882098391652,
    "sampletime": 8.71038687415421,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1712,
    "reward_mean": 4.245259663237126,
    "reward_max": 18.497681407003913,
    "reward_min": -23.881688263986938,
    "reward_std": 10.30617781567769,
    "timesteps": 606219687,
    "learntime": 0.24512037890963256,
    "sampletime": 8.67868810100481,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1713,
    "reward_mean": 6.575235716218815,
    "reward_max": 19.4014289063505,
    "reward_min": -33.49582092056164,
    "reward_std": 10.751926612845365,
    "timesteps": 606554541,
    "learntime": 0.253844273975119,
    "sampletime": 8.411444265162572,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1714,
    "reward_mean": -0.623091620684529,
    "reward_max": 18.063987953595422,
    "reward_min": -34.250985710617066,
    "reward_std": 12.330031356141342,
    "timesteps": 606876777,
    "learntime": 0.2532362719066441,
    "sampletime": 8.522003018064424,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1715,
    "reward_mean": -4.486254514745024,
    "reward_max": 18.205149613874678,
    "reward_min": -43.549596369379394,
    "reward_std": 14.37233578221293,
    "timesteps": 607183722,
    "learntime": 0.24988302285782993,
    "sampletime": 8.30231852689758,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1716,
    "reward_mean": -8.98604528016605,
    "reward_max": 17.170157536976287,
    "reward_min": -44.52778957807812,
    "reward_std": 13.089227458058193,
    "timesteps": 607481916,
    "learntime": 0.25834752107039094,
    "sampletime": 8.122780038043857,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1717,
    "reward_mean": -12.626661770450719,
    "reward_max": 17.168779395040914,
    "reward_min": -45.836923641117416,
    "reward_std": 14.551594913300445,
    "timesteps": 607770996,
    "learntime": 0.24768834095448256,
    "sampletime": 7.898105815984309,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1718,
    "reward_mean": -14.826706353401896,
    "reward_max": 17.586862680361126,
    "reward_min": -53.342025930626164,
    "reward_std": 17.182933225465757,
    "timesteps": 608052102,
    "learntime": 0.25142534892074764,
    "sampletime": 7.532857062062249,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1719,
    "reward_mean": -15.17722734939898,
    "reward_max": 17.462490629246037,
    "reward_min": -57.45923189825327,
    "reward_std": 15.769829976868188,
    "timesteps": 608335353,
    "learntime": 0.2621981028933078,
    "sampletime": 7.913702739868313,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1720,
    "reward_mean": -13.218534327761745,
    "reward_max": 16.877158062003378,
    "reward_min": -45.96784829170528,
    "reward_std": 16.180441726680222,
    "timesteps": 608621007,
    "learntime": 0.25617680395953357,
    "sampletime": 7.719016982940957,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1721,
    "reward_mean": -22.77239782720968,
    "reward_max": 4.976130410774863,
    "reward_min": -55.03832821736719,
    "reward_std": 15.255107776968574,
    "timesteps": 608882343,
    "learntime": 0.2500308998860419,
    "sampletime": 7.6659680139273405,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1722,
    "reward_mean": -24.10447005044523,
    "reward_max": 17.619559585731214,
    "reward_min": -75.45859693920339,
    "reward_std": 20.456448900931072,
    "timesteps": 609137679,
    "learntime": 0.25308444490656257,
    "sampletime": 7.345161663135514,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1723,
    "reward_mean": -23.236351968877564,
    "reward_max": 7.318971841363235,
    "reward_min": -65.4663098136697,
    "reward_std": 19.363579298082247,
    "timesteps": 609400272,
    "learntime": 0.2427378019783646,
    "sampletime": 7.516551878070459,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1724,
    "reward_mean": -24.208788138749874,
    "reward_max": 16.660356345844004,
    "reward_min": -73.3391108804446,
    "reward_std": 19.59890481933491,
    "timesteps": 609657426,
    "learntime": 0.2527808740269393,
    "sampletime": 7.091440371936187,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1725,
    "reward_mean": -21.770344288452627,
    "reward_max": 16.770713232942697,
    "reward_min": -68.81962057867915,
    "reward_std": 17.20507540955013,
    "timesteps": 609921483,
    "learntime": 0.2542155599221587,
    "sampletime": 7.554121502209455,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1726,
    "reward_mean": -6.082166863797594,
    "reward_max": 17.836508744450953,
    "reward_min": -45.16184313593179,
    "reward_std": 15.22894373194468,
    "timesteps": 610225164,
    "learntime": 0.2578510669991374,
    "sampletime": 8.32416188204661,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1727,
    "reward_mean": -0.3812953860621815,
    "reward_max": 16.898407310871534,
    "reward_min": -35.32183342082709,
    "reward_std": 12.788058410832488,
    "timesteps": 610546053,
    "learntime": 0.2614228550810367,
    "sampletime": 8.088838140014559,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1728,
    "reward_mean": -1.5740054598623174,
    "reward_max": 18.973386853146643,
    "reward_min": -43.6258055096771,
    "reward_std": 12.762105054745295,
    "timesteps": 610863177,
    "learntime": 0.25227277004159987,
    "sampletime": 8.062432951992378,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1729,
    "reward_mean": -2.647933677677608,
    "reward_max": 17.382606260333855,
    "reward_min": -44.514201077378615,
    "reward_std": 12.960386819974302,
    "timesteps": 611179224,
    "learntime": 0.2614771381486207,
    "sampletime": 8.433601133991033,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1730,
    "reward_mean": 5.46155901992603,
    "reward_max": 17.736921393058513,
    "reward_min": -20.396451898103503,
    "reward_std": 9.497049878537613,
    "timesteps": 611516865,
    "learntime": 0.24996273196302354,
    "sampletime": 8.519290597876534,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1731,
    "reward_mean": 6.852221464128292,
    "reward_max": 18.043213607249495,
    "reward_min": -14.66761360314647,
    "reward_std": 7.921025693718898,
    "timesteps": 611854017,
    "learntime": 0.2552045560441911,
    "sampletime": 8.595271267928183,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1732,
    "reward_mean": 5.119168366183969,
    "reward_max": 17.495869371069904,
    "reward_min": -25.442444018509846,
    "reward_std": 10.854071153852463,
    "timesteps": 612188934,
    "learntime": 0.25061822310090065,
    "sampletime": 8.343885950976983,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1733,
    "reward_mean": 7.923695691206137,
    "reward_max": 17.65014830820049,
    "reward_min": -13.898094282993549,
    "reward_std": 8.967585595221243,
    "timesteps": 612531705,
    "learntime": 0.2501306349877268,
    "sampletime": 8.769512493163347,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1734,
    "reward_mean": 10.752520209060828,
    "reward_max": 17.732989932782374,
    "reward_min": -6.389457464900758,
    "reward_std": 6.976662511848277,
    "timesteps": 612882036,
    "learntime": 0.24478647811338305,
    "sampletime": 8.942380663007498,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1735,
    "reward_mean": 3.69093604341771,
    "reward_max": 17.79096231917554,
    "reward_min": -16.28894012785256,
    "reward_std": 10.041675558928109,
    "timesteps": 613215468,
    "learntime": 0.25038065598346293,
    "sampletime": 8.559205543948337,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1736,
    "reward_mean": 7.697949817371683,
    "reward_max": 18.631581733805238,
    "reward_min": -20.229226886611688,
    "reward_std": 8.794507137527425,
    "timesteps": 613554642,
    "learntime": 0.2561996039003134,
    "sampletime": 8.756586090894416,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1737,
    "reward_mean": 9.355153879091809,
    "reward_max": 17.69609206756859,
    "reward_min": -6.084948293003964,
    "reward_std": 6.775269209266997,
    "timesteps": 613902960,
    "learntime": 0.2479419158771634,
    "sampletime": 8.760117080062628,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1738,
    "reward_mean": 8.968929205025542,
    "reward_max": 18.03966806985489,
    "reward_min": -16.874351881620846,
    "reward_std": 7.76018515622419,
    "timesteps": 614248770,
    "learntime": 0.24469417380169034,
    "sampletime": 8.69668860710226,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1739,
    "reward_mean": 9.248942184181722,
    "reward_max": 16.219956968970966,
    "reward_min": -16.10678115588345,
    "reward_std": 6.736685991339094,
    "timesteps": 614595198,
    "learntime": 0.25182592892087996,
    "sampletime": 8.808629635954276,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1740,
    "reward_mean": 8.429044521811383,
    "reward_max": 17.103422846673332,
    "reward_min": -17.44561112075021,
    "reward_std": 8.171658447306339,
    "timesteps": 614940705,
    "learntime": 0.25383250904269516,
    "sampletime": 8.8557406028267,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1741,
    "reward_mean": 10.296672908993294,
    "reward_max": 17.185803712102242,
    "reward_min": -12.317354627575298,
    "reward_std": 6.302869886159559,
    "timesteps": 615292638,
    "learntime": 0.24590217415243387,
    "sampletime": 8.88306780392304,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1742,
    "reward_mean": 8.85542607014169,
    "reward_max": 15.66147377667948,
    "reward_min": -6.7631000191058,
    "reward_std": 6.247792517654497,
    "timesteps": 615641808,
    "learntime": 0.251312404172495,
    "sampletime": 8.782226886134595,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1743,
    "reward_mean": 12.204504774291976,
    "reward_max": 16.39877644214192,
    "reward_min": -2.936086243403914,
    "reward_std": 4.065665651511689,
    "timesteps": 615999876,
    "learntime": 0.26087703788653016,
    "sampletime": 8.99219634803012,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1744,
    "reward_mean": 9.873997813937311,
    "reward_max": 16.791044200389553,
    "reward_min": -15.329532883807342,
    "reward_std": 7.33302033508114,
    "timesteps": 616352427,
    "learntime": 0.2564039269927889,
    "sampletime": 8.931132526136935,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1745,
    "reward_mean": 10.632755963814187,
    "reward_max": 16.049702234091736,
    "reward_min": 0.008295015386077768,
    "reward_std": 3.5390479004926716,
    "timesteps": 616709688,
    "learntime": 0.2431601530406624,
    "sampletime": 8.948860657867044,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1746,
    "reward_mean": 8.040454421661035,
    "reward_max": 15.386969236173725,
    "reward_min": -9.90289945040202,
    "reward_std": 7.1173290465562635,
    "timesteps": 617058396,
    "learntime": 0.25985182309523225,
    "sampletime": 8.776642310898751,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1747,
    "reward_mean": 10.489449379863176,
    "reward_max": 15.733114690513402,
    "reward_min": -7.7209089418121835,
    "reward_std": 5.244874239409666,
    "timesteps": 617414025,
    "learntime": 0.2562084498349577,
    "sampletime": 8.985798215959221,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1748,
    "reward_mean": 10.053002566161222,
    "reward_max": 16.276784188670316,
    "reward_min": -17.05554228847508,
    "reward_std": 5.866796662631087,
    "timesteps": 617767194,
    "learntime": 0.250563157023862,
    "sampletime": 8.901237362995744,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1749,
    "reward_mean": 9.918758836057771,
    "reward_max": 15.30701646713758,
    "reward_min": -4.90691823328315,
    "reward_std": 5.311053969210867,
    "timesteps": 618120447,
    "learntime": 0.2574176900088787,
    "sampletime": 9.064231178024784,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1750,
    "reward_mean": 11.002183345544239,
    "reward_max": 15.340707581843043,
    "reward_min": -6.913965712788115,
    "reward_std": 4.426162583163968,
    "timesteps": 618476850,
    "learntime": 0.25309882895089686,
    "sampletime": 9.021081252023578,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1751,
    "reward_mean": 9.358022269720568,
    "reward_max": 15.423492774091246,
    "reward_min": -16.929024719033453,
    "reward_std": 6.529357836577268,
    "timesteps": 618828672,
    "learntime": 0.2546056790743023,
    "sampletime": 8.917224528966472,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1752,
    "reward_mean": 10.046091280846024,
    "reward_max": 15.353566951626403,
    "reward_min": -9.372738167911654,
    "reward_std": 4.336587156255017,
    "timesteps": 619185690,
    "learntime": 0.2499439031817019,
    "sampletime": 8.928570786025375,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1753,
    "reward_mean": 10.569081723450427,
    "reward_max": 15.382587896871634,
    "reward_min": -7.679721458652759,
    "reward_std": 4.529511617177131,
    "timesteps": 619541877,
    "learntime": 0.2528041040059179,
    "sampletime": 8.981895194854587,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1754,
    "reward_mean": 10.565547785152665,
    "reward_max": 14.781983783832839,
    "reward_min": 0.23634089469366146,
    "reward_std": 3.1346301538156824,
    "timesteps": 619900446,
    "learntime": 0.27366137807257473,
    "sampletime": 8.957217623945326,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1755,
    "reward_mean": 9.15387603238108,
    "reward_max": 14.56919947264109,
    "reward_min": -18.759404005158242,
    "reward_std": 6.433259250917403,
    "timesteps": 620254518,
    "learntime": 0.2590049300342798,
    "sampletime": 8.969591319095343,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1756,
    "reward_mean": 8.336386324848892,
    "reward_max": 15.423801817938289,
    "reward_min": -9.245979009695779,
    "reward_std": 5.910499087685395,
    "timesteps": 620606925,
    "learntime": 0.2559752210509032,
    "sampletime": 8.886173714883626,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1757,
    "reward_mean": 10.763041250464727,
    "reward_max": 15.028458903915533,
    "reward_min": -5.667596090229282,
    "reward_std": 3.980342037037294,
    "timesteps": 620965170,
    "learntime": 0.25490026106126606,
    "sampletime": 8.974403952015564,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1758,
    "reward_mean": 9.97196434192082,
    "reward_max": 15.403741584780317,
    "reward_min": -7.1778400380686485,
    "reward_std": 5.0177447236374135,
    "timesteps": 621320388,
    "learntime": 0.2588416440412402,
    "sampletime": 8.946717499056831,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1759,
    "reward_mean": 10.244132718463357,
    "reward_max": 15.220627358153274,
    "reward_min": -6.422996853343253,
    "reward_std": 5.234007503821928,
    "timesteps": 621675726,
    "learntime": 0.25460836407728493,
    "sampletime": 8.819685531081632,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1760,
    "reward_mean": 7.850370847890831,
    "reward_max": 13.927164530907184,
    "reward_min": -8.986867615692036,
    "reward_std": 5.989504331565649,
    "timesteps": 622028622,
    "learntime": 0.25074384501203895,
    "sampletime": 8.785565865924582,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1761,
    "reward_mean": 10.536291050984362,
    "reward_max": 14.529099953427881,
    "reward_min": 0.5398094678989053,
    "reward_std": 3.838208020256366,
    "timesteps": 622384797,
    "learntime": 0.24773020599968731,
    "sampletime": 9.008261950919405,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1762,
    "reward_mean": 10.26464076253625,
    "reward_max": 15.37034515128824,
    "reward_min": -3.937332527322321,
    "reward_std": 4.469022594945345,
    "timesteps": 622739475,
    "learntime": 0.24963319883681834,
    "sampletime": 8.985654366901144,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1763,
    "reward_mean": 11.475608616705273,
    "reward_max": 15.606836071377266,
    "reward_min": -4.779036771835916,
    "reward_std": 4.403701783789447,
    "timesteps": 623096949,
    "learntime": 0.25134809012524784,
    "sampletime": 8.989593612961471,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1764,
    "reward_mean": 9.466176718980268,
    "reward_max": 16.53922331818577,
    "reward_min": -4.986194826027555,
    "reward_std": 5.511231915516575,
    "timesteps": 623449782,
    "learntime": 0.25378263113088906,
    "sampletime": 8.826424694852903,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1765,
    "reward_mean": 12.283469951270407,
    "reward_max": 16.44039252345542,
    "reward_min": 1.6521993485335804,
    "reward_std": 3.298681411004851,
    "timesteps": 623808348,
    "learntime": 0.2657443662174046,
    "sampletime": 9.041532458039,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1766,
    "reward_mean": 11.363985755956563,
    "reward_max": 15.635813130700791,
    "reward_min": 1.6603341504704785,
    "reward_std": 3.9001604427298093,
    "timesteps": 624166500,
    "learntime": 0.2609494118951261,
    "sampletime": 8.848824898945168,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1767,
    "reward_mean": 11.37344794688319,
    "reward_max": 17.1234114428393,
    "reward_min": -4.8800388503339995,
    "reward_std": 4.5170551350746155,
    "timesteps": 624523065,
    "learntime": 0.24804212106391788,
    "sampletime": 8.873745281947777,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1768,
    "reward_mean": 11.177796785710104,
    "reward_max": 16.146269028554805,
    "reward_min": -6.380511084148157,
    "reward_std": 5.250171124523328,
    "timesteps": 624878829,
    "learntime": 0.25834028190001845,
    "sampletime": 8.824801967013627,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1769,
    "reward_mean": 9.273899348808808,
    "reward_max": 16.362745033280756,
    "reward_min": -7.744118271974117,
    "reward_std": 6.138208909912472,
    "timesteps": 625229298,
    "learntime": 0.25638851686380804,
    "sampletime": 8.76289996295236,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1770,
    "reward_mean": 11.543199211259054,
    "reward_max": 16.519390760697807,
    "reward_min": -3.148077482967922,
    "reward_std": 4.493970659279077,
    "timesteps": 625584450,
    "learntime": 0.26070997188799083,
    "sampletime": 8.709430115995929,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1771,
    "reward_mean": 12.924704577735177,
    "reward_max": 16.53379390479919,
    "reward_min": -3.2525299438381334,
    "reward_std": 4.1285932328840556,
    "timesteps": 625941576,
    "learntime": 0.26033867499791086,
    "sampletime": 8.867972640087828,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1772,
    "reward_mean": 9.894932992051254,
    "reward_max": 17.642654147507113,
    "reward_min": -7.21737256362174,
    "reward_std": 7.088238306915911,
    "timesteps": 626291880,
    "learntime": 0.26578496489673853,
    "sampletime": 8.828899122076109,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1773,
    "reward_mean": 12.083268774929788,
    "reward_max": 17.70858613951273,
    "reward_min": -5.236901291233322,
    "reward_std": 5.704643425330066,
    "timesteps": 626646573,
    "learntime": 0.2609023340046406,
    "sampletime": 8.723334785085171,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1774,
    "reward_mean": 12.405563435425982,
    "reward_max": 19.99414340524571,
    "reward_min": -12.93770314258857,
    "reward_std": 5.6336974553019825,
    "timesteps": 627001023,
    "learntime": 0.25772929284721613,
    "sampletime": 8.845137997996062,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1775,
    "reward_mean": 10.580051806476831,
    "reward_max": 17.64259041959391,
    "reward_min": -3.7265023261486836,
    "reward_std": 6.135703095173565,
    "timesteps": 627353679,
    "learntime": 0.2580685520078987,
    "sampletime": 8.817437618970871,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1776,
    "reward_mean": 10.469261028530065,
    "reward_max": 18.496704961448387,
    "reward_min": -4.890484962799364,
    "reward_std": 7.291397253253689,
    "timesteps": 627705897,
    "learntime": 0.25440804613754153,
    "sampletime": 8.854536053026095,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1777,
    "reward_mean": 12.669254437325062,
    "reward_max": 18.602818687051307,
    "reward_min": -4.051157441392371,
    "reward_std": 6.2870303651507,
    "timesteps": 628060089,
    "learntime": 0.25923963100649416,
    "sampletime": 8.851938142208382,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1778,
    "reward_mean": 13.040973172736818,
    "reward_max": 19.665705566950646,
    "reward_min": -6.06255230489611,
    "reward_std": 5.857791522997457,
    "timesteps": 628414221,
    "learntime": 0.24950709100812674,
    "sampletime": 8.853427038062364,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1779,
    "reward_mean": 10.291916203848086,
    "reward_max": 19.231651371934053,
    "reward_min": -15.68422891650787,
    "reward_std": 8.660999524198312,
    "timesteps": 628763337,
    "learntime": 0.255846698069945,
    "sampletime": 8.931765925139189,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1780,
    "reward_mean": 7.804196420225247,
    "reward_max": 18.962696280530906,
    "reward_min": -21.52903988547483,
    "reward_std": 9.257589674240188,
    "timesteps": 629107701,
    "learntime": 0.256527396151796,
    "sampletime": 8.890651346184313,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1781,
    "reward_mean": 8.235140171666128,
    "reward_max": 19.403853623610402,
    "reward_min": -14.63271856372895,
    "reward_std": 9.448787112548514,
    "timesteps": 629456085,
    "learntime": 0.2568994448520243,
    "sampletime": 8.731844030087814,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1782,
    "reward_mean": 8.47769328166408,
    "reward_max": 19.616701836006317,
    "reward_min": -15.674433968568339,
    "reward_std": 8.68378777420771,
    "timesteps": 629804022,
    "learntime": 0.2591162291355431,
    "sampletime": 8.74800429889001,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1783,
    "reward_mean": 6.209482841758717,
    "reward_max": 19.424853697482664,
    "reward_min": -14.411476592561513,
    "reward_std": 9.365828768975035,
    "timesteps": 630152103,
    "learntime": 0.25760371796786785,
    "sampletime": 8.78412596997805,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1784,
    "reward_mean": 10.001056586896812,
    "reward_max": 19.425714980415776,
    "reward_min": -12.151320936384076,
    "reward_std": 9.108593353253443,
    "timesteps": 630500763,
    "learntime": 0.26422916911542416,
    "sampletime": 8.884627474937588,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1785,
    "reward_mean": 11.181066401102608,
    "reward_max": 20.27112571555578,
    "reward_min": -3.862330160738732,
    "reward_std": 7.859507355839869,
    "timesteps": 630850230,
    "learntime": 0.24773467099294066,
    "sampletime": 8.808279741089791,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1786,
    "reward_mean": 14.077722187541065,
    "reward_max": 21.117832885670587,
    "reward_min": -3.3480865845569614,
    "reward_std": 6.160485331154308,
    "timesteps": 631205358,
    "learntime": 0.24574814992956817,
    "sampletime": 9.073711378965527,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1787,
    "reward_mean": 8.073442329264791,
    "reward_max": 19.98916485465386,
    "reward_min": -21.744195089632264,
    "reward_std": 11.209002436813533,
    "timesteps": 631548561,
    "learntime": 0.2664267981890589,
    "sampletime": 8.667855308856815,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1788,
    "reward_mean": 11.252958489370414,
    "reward_max": 18.84191713212446,
    "reward_min": -11.079499194754234,
    "reward_std": 7.392858016092068,
    "timesteps": 631898199,
    "learntime": 0.26054429984651506,
    "sampletime": 8.793950793100521,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1789,
    "reward_mean": 12.906263176239946,
    "reward_max": 19.26897412731848,
    "reward_min": -12.892565766829206,
    "reward_std": 6.136529642857003,
    "timesteps": 632254128,
    "learntime": 0.2536680439952761,
    "sampletime": 8.97279132087715,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1790,
    "reward_mean": 10.597740020961295,
    "reward_max": 19.12288653266538,
    "reward_min": -6.387475985345772,
    "reward_std": 6.696359974387617,
    "timesteps": 632607936,
    "learntime": 0.25576937198638916,
    "sampletime": 8.871942749014124,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1791,
    "reward_mean": 12.753775965507417,
    "reward_max": 19.219595939984874,
    "reward_min": -2.3989340578149476,
    "reward_std": 5.803167217667967,
    "timesteps": 632963280,
    "learntime": 0.2716064869891852,
    "sampletime": 8.926387764047831,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1792,
    "reward_mean": 9.812682188878913,
    "reward_max": 18.670751421864033,
    "reward_min": -22.22256243324867,
    "reward_std": 9.091584116948033,
    "timesteps": 633314817,
    "learntime": 0.26479264814406633,
    "sampletime": 8.878802370047197,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1793,
    "reward_mean": 14.529079852471217,
    "reward_max": 19.74200197408208,
    "reward_min": -3.4564504931172952,
    "reward_std": 5.051560893185201,
    "timesteps": 633669534,
    "learntime": 0.25925781414844096,
    "sampletime": 9.02595006278716,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1794,
    "reward_mean": 8.732819396889326,
    "reward_max": 19.936791391208924,
    "reward_min": -21.49741126212434,
    "reward_std": 9.246178439531983,
    "timesteps": 634016898,
    "learntime": 0.25523788295686245,
    "sampletime": 8.773951924173161,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1795,
    "reward_mean": 13.251037699332684,
    "reward_max": 19.3339376439284,
    "reward_min": -3.446559900463783,
    "reward_std": 5.397052740215408,
    "timesteps": 634370886,
    "learntime": 0.25370831112377346,
    "sampletime": 8.908131357980892,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1796,
    "reward_mean": 11.171449424048557,
    "reward_max": 20.123788519003988,
    "reward_min": -11.80677301846586,
    "reward_std": 7.22923026076038,
    "timesteps": 634723416,
    "learntime": 0.24684311682358384,
    "sampletime": 8.814778458094224,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1797,
    "reward_mean": 10.297142856816293,
    "reward_max": 18.672882994079508,
    "reward_min": -23.293023725361284,
    "reward_std": 7.838741979807724,
    "timesteps": 635076816,
    "learntime": 0.3026396599598229,
    "sampletime": 8.817568515893072,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1798,
    "reward_mean": 10.163241120598018,
    "reward_max": 19.51961276286535,
    "reward_min": -12.578552951104939,
    "reward_std": 7.87039959201827,
    "timesteps": 635429694,
    "learntime": 0.25845327181741595,
    "sampletime": 8.82332905405201,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1799,
    "reward_mean": 14.082255544020278,
    "reward_max": 19.560141019419664,
    "reward_min": -2.940647613990943,
    "reward_std": 5.464588872151331,
    "timesteps": 635787324,
    "learntime": 0.25264264899306,
    "sampletime": 9.077005452942103,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1800,
    "reward_mean": 15.131841993929953,
    "reward_max": 18.47924087441061,
    "reward_min": -2.010067212663481,
    "reward_std": 3.3137877446920396,
    "timesteps": 636147039,
    "learntime": 0.26044438197277486,
    "sampletime": 8.962222813861445,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1801,
    "reward_mean": 10.435937114263504,
    "reward_max": 19.58092706975048,
    "reward_min": -21.439152860014342,
    "reward_std": 9.162476774541721,
    "timesteps": 636499758,
    "learntime": 0.1183112149592489,
    "sampletime": 8.80202525597997,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1802,
    "reward_mean": 11.75972236261582,
    "reward_max": 17.82487746467814,
    "reward_min": -5.395319755316783,
    "reward_std": 5.888679106966043,
    "timesteps": 636853383,
    "learntime": 0.26304498594254255,
    "sampletime": 8.803433358902112,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1803,
    "reward_mean": 14.351038084135359,
    "reward_max": 18.65845386573346,
    "reward_min": 3.7110886605082523,
    "reward_std": 3.5144346971556395,
    "timesteps": 637212783,
    "learntime": 0.25397634389810264,
    "sampletime": 8.89352754689753,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1804,
    "reward_mean": 13.90610781099063,
    "reward_max": 18.74292364876743,
    "reward_min": -5.464091576533531,
    "reward_std": 3.7157567886486866,
    "timesteps": 637571580,
    "learntime": 0.25766148418188095,
    "sampletime": 8.925003381911665,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1805,
    "reward_mean": 14.472293431566097,
    "reward_max": 18.669790138225917,
    "reward_min": 5.42080051348029,
    "reward_std": 3.0857128571947916,
    "timesteps": 637930239,
    "learntime": 0.2627389319241047,
    "sampletime": 8.964321194915101,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1806,
    "reward_mean": 10.894268163125744,
    "reward_max": 18.374001174527535,
    "reward_min": -4.630452168214659,
    "reward_std": 5.616896630430698,
    "timesteps": 638282772,
    "learntime": 0.2540110789705068,
    "sampletime": 8.79693275410682,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1807,
    "reward_mean": 15.31757233721342,
    "reward_max": 18.572579814392757,
    "reward_min": 5.654988648642424,
    "reward_std": 2.412901925819325,
    "timesteps": 638642364,
    "learntime": 0.2541420559864491,
    "sampletime": 8.996474734973162,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1808,
    "reward_mean": 13.928937549067715,
    "reward_max": 19.153389396374134,
    "reward_min": 2.972584327104302,
    "reward_std": 4.026138653239144,
    "timesteps": 638998893,
    "learntime": 0.2512410068884492,
    "sampletime": 9.062204431043938,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1809,
    "reward_mean": 14.143992754213247,
    "reward_max": 17.924754274630686,
    "reward_min": -3.7087956013415466,
    "reward_std": 3.5007787833638173,
    "timesteps": 639357501,
    "learntime": 0.25050323992036283,
    "sampletime": 9.081407535122707,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1810,
    "reward_mean": 10.622805971706743,
    "reward_max": 18.765413367062465,
    "reward_min": -23.75307901815695,
    "reward_std": 7.387746663497967,
    "timesteps": 639708924,
    "learntime": 0.26267766510136425,
    "sampletime": 8.735003619920462,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1811,
    "reward_mean": 13.577162871507849,
    "reward_max": 18.83298226397936,
    "reward_min": -4.942608700675519,
    "reward_std": 4.907924519181913,
    "timesteps": 640064178,
    "learntime": 0.26433008909225464,
    "sampletime": 8.792134958086535,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1812,
    "reward_mean": 13.69485523161649,
    "reward_max": 20.032134502123334,
    "reward_min": -1.5641041684430084,
    "reward_std": 4.4257492380682955,
    "timesteps": 640422489,
    "learntime": 0.2656359220854938,
    "sampletime": 8.982734529068694,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1813,
    "reward_mean": 15.032738941878485,
    "reward_max": 18.928750745860413,
    "reward_min": 5.218069394584745,
    "reward_std": 2.999940477838189,
    "timesteps": 640781121,
    "learntime": 0.25178333511576056,
    "sampletime": 9.082946249982342,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1814,
    "reward_mean": 14.709406408474285,
    "reward_max": 19.815178804367665,
    "reward_min": -3.8416806155404313,
    "reward_std": 4.128096685722192,
    "timesteps": 641139759,
    "learntime": 0.2614809079095721,
    "sampletime": 9.054213684983552,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1815,
    "reward_mean": 12.402613938907027,
    "reward_max": 18.77539647769916,
    "reward_min": -12.243865210478278,
    "reward_std": 6.926574780415248,
    "timesteps": 641490954,
    "learntime": 0.2582882021088153,
    "sampletime": 8.982800150057301,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1816,
    "reward_mean": 12.918370505610547,
    "reward_max": 19.32853094724741,
    "reward_min": -13.497882717550086,
    "reward_std": 6.7956813862536105,
    "timesteps": 641846205,
    "learntime": 0.26740512414835393,
    "sampletime": 8.784442155156285,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1817,
    "reward_mean": 13.191027154157217,
    "reward_max": 19.63619427504035,
    "reward_min": -11.261250967313323,
    "reward_std": 6.105089233942548,
    "timesteps": 642200694,
    "learntime": 0.25982508808374405,
    "sampletime": 9.020495154894888,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1818,
    "reward_mean": 13.371033364448888,
    "reward_max": 19.596334777384367,
    "reward_min": -6.711913374545418,
    "reward_std": 6.389685408851387,
    "timesteps": 642556005,
    "learntime": 0.25796241010539234,
    "sampletime": 8.933000654913485,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1819,
    "reward_mean": 14.913500017878409,
    "reward_max": 20.45621300849921,
    "reward_min": 3.1030191270816165,
    "reward_std": 4.277413965590786,
    "timesteps": 642913155,
    "learntime": 0.2630514979828149,
    "sampletime": 8.918557439930737,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1820,
    "reward_mean": 13.321192794157607,
    "reward_max": 19.85053014098384,
    "reward_min": -13.523463851772249,
    "reward_std": 5.601581514058702,
    "timesteps": 643267695,
    "learntime": 0.2671332829631865,
    "sampletime": 8.854984959820285,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1821,
    "reward_mean": 15.364710465896229,
    "reward_max": 18.994263726667583,
    "reward_min": 4.821483120294004,
    "reward_std": 3.5390975578816475,
    "timesteps": 643625172,
    "learntime": 0.2550718111451715,
    "sampletime": 9.026536426972598,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1822,
    "reward_mean": 12.741299816792655,
    "reward_max": 19.646319980901247,
    "reward_min": -1.9484060380103427,
    "reward_std": 6.158683839711032,
    "timesteps": 643977558,
    "learntime": 0.2585011508781463,
    "sampletime": 9.150441006058827,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1823,
    "reward_mean": 13.741251463851885,
    "reward_max": 19.98586947995654,
    "reward_min": -9.734968733475808,
    "reward_std": 6.0589836091649385,
    "timesteps": 644332152,
    "learntime": 0.2557089270558208,
    "sampletime": 8.833701444091275,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1824,
    "reward_mean": 14.8868165547905,
    "reward_max": 19.132006581449374,
    "reward_min": 6.4152287564273,
    "reward_std": 4.26078058826622,
    "timesteps": 644688606,
    "learntime": 0.2771513687912375,
    "sampletime": 8.911824600072578,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1825,
    "reward_mean": 13.33313524255156,
    "reward_max": 19.232316147013936,
    "reward_min": -4.43659688257895,
    "reward_std": 5.830112388927556,
    "timesteps": 645043629,
    "learntime": 0.25569770694710314,
    "sampletime": 8.901892584050074,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1826,
    "reward_mean": 11.626868059538335,
    "reward_max": 21.190120281686887,
    "reward_min": -12.352762862858881,
    "reward_std": 8.257903615323471,
    "timesteps": 645393405,
    "learntime": 0.2627585669979453,
    "sampletime": 8.851908517070115,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1827,
    "reward_mean": 14.55432318376999,
    "reward_max": 21.022375753205836,
    "reward_min": -1.993398773469818,
    "reward_std": 5.834672480028712,
    "timesteps": 645748413,
    "learntime": 0.25513910804875195,
    "sampletime": 8.912231439957395,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1828,
    "reward_mean": 12.904720694917803,
    "reward_max": 20.825227920670937,
    "reward_min": -11.397216390423251,
    "reward_std": 6.992815558265729,
    "timesteps": 646099272,
    "learntime": 0.25494990102015436,
    "sampletime": 8.916378538822755,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1829,
    "reward_mean": 15.269920405170156,
    "reward_max": 20.30874783442722,
    "reward_min": -5.979208597913387,
    "reward_std": 5.475127957968724,
    "timesteps": 646455213,
    "learntime": 0.25477937096729875,
    "sampletime": 9.085800595814362,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1830,
    "reward_mean": 12.630551582817384,
    "reward_max": 21.531904478261076,
    "reward_min": -10.696020058663144,
    "reward_std": 8.183002598611742,
    "timesteps": 646805349,
    "learntime": 0.25487601198256016,
    "sampletime": 8.926051707938313,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1831,
    "reward_mean": 16.922788899106756,
    "reward_max": 21.90203709062895,
    "reward_min": 6.881520227555566,
    "reward_std": 4.289060161301801,
    "timesteps": 647163198,
    "learntime": 0.25571555900387466,
    "sampletime": 8.930059406906366,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1832,
    "reward_mean": 14.478008153387877,
    "reward_max": 21.249794365912546,
    "reward_min": -3.01652717609382,
    "reward_std": 5.735927290973243,
    "timesteps": 647517432,
    "learntime": 0.2503512839321047,
    "sampletime": 8.789711529156193,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1833,
    "reward_mean": 14.505311580813284,
    "reward_max": 21.439637546995503,
    "reward_min": -11.450317790370198,
    "reward_std": 7.217373364462608,
    "timesteps": 647872110,
    "learntime": 0.260827454039827,
    "sampletime": 8.835452508879825,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1834,
    "reward_mean": 12.602120495400527,
    "reward_max": 21.267051438497603,
    "reward_min": -10.341457339201233,
    "reward_std": 7.921257968482619,
    "timesteps": 648225369,
    "learntime": 0.25621743011288345,
    "sampletime": 8.927677534054965,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1835,
    "reward_mean": 12.07311128825325,
    "reward_max": 20.899887071735446,
    "reward_min": -29.220189248557404,
    "reward_std": 8.279944107143312,
    "timesteps": 648578892,
    "learntime": 0.26764453295618296,
    "sampletime": 8.978131248848513,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1836,
    "reward_mean": 15.678420558430364,
    "reward_max": 21.96843957533645,
    "reward_min": -1.5308189847220874,
    "reward_std": 6.39656403275006,
    "timesteps": 648933708,
    "learntime": 0.27036123210564256,
    "sampletime": 8.836142278043553,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1837,
    "reward_mean": 11.21261478430141,
    "reward_max": 21.573198258735676,
    "reward_min": -20.101428657747235,
    "reward_std": 9.369790627087106,
    "timesteps": 649282254,
    "learntime": 0.26498112408444285,
    "sampletime": 8.70129071502015,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1838,
    "reward_mean": 13.403225417852854,
    "reward_max": 21.0613878283043,
    "reward_min": -6.8828940614863905,
    "reward_std": 7.310829820909461,
    "timesteps": 649634229,
    "learntime": 0.2524005000013858,
    "sampletime": 8.75564184691757,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1839,
    "reward_mean": 15.039346504475693,
    "reward_max": 22.658980566457924,
    "reward_min": -0.48143210468433073,
    "reward_std": 6.619870922750551,
    "timesteps": 649989291,
    "learntime": 0.25884244008921087,
    "sampletime": 8.763337017036974,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1840,
    "reward_mean": 11.336128241143498,
    "reward_max": 22.321653757179664,
    "reward_min": -21.915131735770654,
    "reward_std": 8.565542182098701,
    "timesteps": 650336241,
    "learntime": 0.2639631840866059,
    "sampletime": 8.678232979029417,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1841,
    "reward_mean": 13.652709410358586,
    "reward_max": 21.5199097188941,
    "reward_min": -20.66528939695634,
    "reward_std": 8.174177622380517,
    "timesteps": 650689305,
    "learntime": 0.2532546760048717,
    "sampletime": 8.924229911062866,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1842,
    "reward_mean": 15.681528295742936,
    "reward_max": 21.951468528530913,
    "reward_min": -1.3844112288277353,
    "reward_std": 6.057116976049265,
    "timesteps": 651044019,
    "learntime": 0.2570322500541806,
    "sampletime": 8.802080598892644,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1843,
    "reward_mean": 13.442678342379592,
    "reward_max": 21.936871236446063,
    "reward_min": -2.2787018649943374,
    "reward_std": 6.7980444741076,
    "timesteps": 651395061,
    "learntime": 0.27312310691922903,
    "sampletime": 8.825201639905572,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1844,
    "reward_mean": 9.975512288104007,
    "reward_max": 21.124809808295325,
    "reward_min": -17.125003571057643,
    "reward_std": 9.145954729162808,
    "timesteps": 651743448,
    "learntime": 0.248320345999673,
    "sampletime": 8.812701697926968,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1845,
    "reward_mean": 11.192786128774223,
    "reward_max": 21.65159956202136,
    "reward_min": -19.1861378054371,
    "reward_std": 10.352927335481693,
    "timesteps": 652092498,
    "learntime": 0.2642818819731474,
    "sampletime": 8.791442279936746,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1846,
    "reward_mean": 13.130834167358428,
    "reward_max": 21.20858887763637,
    "reward_min": -5.184237626956832,
    "reward_std": 7.1849631429386225,
    "timesteps": 652444845,
    "learntime": 0.2533893750514835,
    "sampletime": 8.876246021129191,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1847,
    "reward_mean": 13.723180409666178,
    "reward_max": 20.833318771434616,
    "reward_min": -2.585657179983563,
    "reward_std": 6.494163587292231,
    "timesteps": 652796949,
    "learntime": 0.2769601789768785,
    "sampletime": 8.698966179043055,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1848,
    "reward_mean": 14.821498683465482,
    "reward_max": 20.794476844768116,
    "reward_min": -0.6308444278547604,
    "reward_std": 4.986646518482465,
    "timesteps": 653153232,
    "learntime": 0.26004639198072255,
    "sampletime": 8.930337765952572,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1849,
    "reward_mean": 16.630897136371914,
    "reward_max": 21.024463199384186,
    "reward_min": -4.102062188681554,
    "reward_std": 4.518039069676219,
    "timesteps": 653511366,
    "learntime": 0.2655675371643156,
    "sampletime": 8.90161217795685,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1850,
    "reward_mean": 13.795244274078225,
    "reward_max": 21.531226479164385,
    "reward_min": -13.339373257709669,
    "reward_std": 6.215405955402778,
    "timesteps": 653867934,
    "learntime": 0.2580641619861126,
    "sampletime": 8.967274415073916,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1851,
    "reward_mean": 12.328993619590673,
    "reward_max": 21.848124368156828,
    "reward_min": -4.19741541253064,
    "reward_std": 5.781835817761946,
    "timesteps": 654218688,
    "learntime": 0.256405662978068,
    "sampletime": 8.790258678840473,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1852,
    "reward_mean": 13.425759119335961,
    "reward_max": 19.27153981478433,
    "reward_min": -3.591199347742885,
    "reward_std": 5.268072065761023,
    "timesteps": 654573558,
    "learntime": 0.2559570539742708,
    "sampletime": 8.922386566875502,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1853,
    "reward_mean": 14.53136231189603,
    "reward_max": 19.961221132794332,
    "reward_min": -2.0053368688800988,
    "reward_std": 4.588193684679979,
    "timesteps": 654930144,
    "learntime": 0.25730434292927384,
    "sampletime": 8.959418157115579,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1854,
    "reward_mean": 14.107372425467364,
    "reward_max": 19.43222623664152,
    "reward_min": -3.184612139930122,
    "reward_std": 4.96307248069117,
    "timesteps": 655285953,
    "learntime": 0.2578543259296566,
    "sampletime": 8.872027785982937,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1855,
    "reward_mean": 13.312987522844992,
    "reward_max": 18.58649831938435,
    "reward_min": 3.480066756848387,
    "reward_std": 4.370119963521425,
    "timesteps": 655641444,
    "learntime": 0.27410702500492334,
    "sampletime": 8.841693583875895,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1856,
    "reward_mean": 13.265618708476092,
    "reward_max": 18.88964860043941,
    "reward_min": 3.184986190270686,
    "reward_std": 4.08069791540992,
    "timesteps": 655998525,
    "learntime": 0.2675301830749959,
    "sampletime": 9.023682175204158,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1857,
    "reward_mean": 15.135697070309785,
    "reward_max": 19.849015557397664,
    "reward_min": -0.566606838781757,
    "reward_std": 3.448428255111691,
    "timesteps": 656358102,
    "learntime": 0.25464605283923447,
    "sampletime": 8.967788808047771,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1858,
    "reward_mean": 14.426152517299691,
    "reward_max": 18.750733161506815,
    "reward_min": 3.705667295098076,
    "reward_std": 3.1194550535608734,
    "timesteps": 656717712,
    "learntime": 0.2679730551317334,
    "sampletime": 9.011722438968718,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1859,
    "reward_mean": 13.1323104875988,
    "reward_max": 19.06715318886563,
    "reward_min": -1.6098310625970766,
    "reward_std": 4.5041122589993625,
    "timesteps": 657074406,
    "learntime": 0.260468513937667,
    "sampletime": 8.804217956960201,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1860,
    "reward_mean": 13.924373523062872,
    "reward_max": 19.162878878008943,
    "reward_min": 3.8173161549599475,
    "reward_std": 3.724495959877599,
    "timesteps": 657432534,
    "learntime": 0.2645882489159703,
    "sampletime": 8.94888473302126,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1861,
    "reward_mean": 14.493075493080099,
    "reward_max": 19.377927827247824,
    "reward_min": -0.6352412788352613,
    "reward_std": 3.9251443774411494,
    "timesteps": 657790632,
    "learntime": 0.26991948997601867,
    "sampletime": 8.770606462145224,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1862,
    "reward_mean": 15.714288591813546,
    "reward_max": 18.608359400218237,
    "reward_min": 10.323394089282369,
    "reward_std": 1.5957662604236709,
    "timesteps": 658151352,
    "learntime": 0.26029446884058416,
    "sampletime": 8.94664626615122,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1863,
    "reward_mean": 13.70686282302121,
    "reward_max": 19.2684422702331,
    "reward_min": -2.7493679962224484,
    "reward_std": 5.021986214277554,
    "timesteps": 658506264,
    "learntime": 0.26553674996830523,
    "sampletime": 8.810413728002459,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1864,
    "reward_mean": 14.761841815419437,
    "reward_max": 20.05294305524633,
    "reward_min": -5.696747019195535,
    "reward_std": 4.406724141250082,
    "timesteps": 658863771,
    "learntime": 0.2554806990083307,
    "sampletime": 8.800323511939496,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1865,
    "reward_mean": 13.913626509819242,
    "reward_max": 18.90710538445097,
    "reward_min": 1.6312101205641574,
    "reward_std": 4.486424650562465,
    "timesteps": 659220111,
    "learntime": 0.2652294731233269,
    "sampletime": 9.045126625103876,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1866,
    "reward_mean": 12.54926467168688,
    "reward_max": 20.535055202745948,
    "reward_min": -15.305373752962398,
    "reward_std": 7.692896308580928,
    "timesteps": 659571423,
    "learntime": 0.2612882119137794,
    "sampletime": 8.763521327869967,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1867,
    "reward_mean": 13.732790168597708,
    "reward_max": 21.22020363276048,
    "reward_min": -3.417277700036449,
    "reward_std": 4.989159438775538,
    "timesteps": 659927238,
    "learntime": 0.2773082999046892,
    "sampletime": 8.81665381602943,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1868,
    "reward_mean": 12.762995762713395,
    "reward_max": 20.81923643708454,
    "reward_min": -13.239255590505449,
    "reward_std": 6.576878160013543,
    "timesteps": 660280896,
    "learntime": 0.26102085784077644,
    "sampletime": 8.936942111933604,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1869,
    "reward_mean": 12.098489761555394,
    "reward_max": 21.790580768320723,
    "reward_min": -20.799852101231053,
    "reward_std": 9.69685915653849,
    "timesteps": 660632730,
    "learntime": 0.26480547711253166,
    "sampletime": 8.81786495889537,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1870,
    "reward_mean": 11.227173770886555,
    "reward_max": 21.99762194062879,
    "reward_min": -11.419337757030563,
    "reward_std": 7.722180769995926,
    "timesteps": 660982863,
    "learntime": 0.2825780638959259,
    "sampletime": 8.768047024961561,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1871,
    "reward_mean": 11.313164352396491,
    "reward_max": 19.797495840406608,
    "reward_min": -14.256498557046257,
    "reward_std": 8.254718035525787,
    "timesteps": 661333761,
    "learntime": 0.26428682007826865,
    "sampletime": 8.734293747926131,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1872,
    "reward_mean": 4.991367248806058,
    "reward_max": 20.905580287333574,
    "reward_min": -35.90432151633488,
    "reward_std": 11.889149721229904,
    "timesteps": 661672191,
    "learntime": 0.266113996040076,
    "sampletime": 8.617768769850954,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1873,
    "reward_mean": 11.03544900204097,
    "reward_max": 21.88138753096831,
    "reward_min": -19.558810204532676,
    "reward_std": 9.241395920041196,
    "timesteps": 662023743,
    "learntime": 0.2652606649789959,
    "sampletime": 8.692732673836872,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1874,
    "reward_mean": 8.958324181716431,
    "reward_max": 20.29930012751073,
    "reward_min": -14.74381398803301,
    "reward_std": 9.580727253403742,
    "timesteps": 662372505,
    "learntime": 0.26270454889163375,
    "sampletime": 8.708908146014437,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1875,
    "reward_mean": 13.28265173568403,
    "reward_max": 20.286868388101347,
    "reward_min": -13.681223290238647,
    "reward_std": 7.683012715632202,
    "timesteps": 662725512,
    "learntime": 0.2601854889653623,
    "sampletime": 8.83975541498512,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1876,
    "reward_mean": 8.435685786139576,
    "reward_max": 21.351325938710946,
    "reward_min": -52.78775107702522,
    "reward_std": 12.20454498314603,
    "timesteps": 663072366,
    "learntime": 0.2549438651185483,
    "sampletime": 8.68213894404471,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1877,
    "reward_mean": 9.829942810330502,
    "reward_max": 20.30204492227171,
    "reward_min": -23.25246764045909,
    "reward_std": 10.05872008372598,
    "timesteps": 663421488,
    "learntime": 0.256343588931486,
    "sampletime": 8.742565588094294,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1878,
    "reward_mean": 10.111935552154103,
    "reward_max": 20.452594173774635,
    "reward_min": -11.121913876966131,
    "reward_std": 7.435916532894967,
    "timesteps": 663771348,
    "learntime": 0.2619805717840791,
    "sampletime": 8.80177867715247,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1879,
    "reward_mean": 8.959084514883623,
    "reward_max": 18.891812084768322,
    "reward_min": -14.897947947656963,
    "reward_std": 8.27180347151534,
    "timesteps": 664121769,
    "learntime": 0.26634376402944326,
    "sampletime": 8.755032679997385,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1880,
    "reward_mean": 11.462743076762294,
    "reward_max": 18.78960830324936,
    "reward_min": -6.100636911908873,
    "reward_std": 5.570714430476017,
    "timesteps": 664475379,
    "learntime": 0.267984600039199,
    "sampletime": 8.847238471033052,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1881,
    "reward_mean": 14.057512114773308,
    "reward_max": 18.640251313145694,
    "reward_min": -0.7003370408801314,
    "reward_std": 3.908664657849474,
    "timesteps": 664834230,
    "learntime": 0.2713028620928526,
    "sampletime": 8.90620745997876,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1882,
    "reward_mean": 11.701444053953498,
    "reward_max": 19.183516529660363,
    "reward_min": -4.493793700102043,
    "reward_std": 5.132165436552286,
    "timesteps": 665190096,
    "learntime": 0.25666163209825754,
    "sampletime": 8.890507317846641,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1883,
    "reward_mean": 12.460984743305907,
    "reward_max": 18.935535711100474,
    "reward_min": -21.101106247046232,
    "reward_std": 6.043694834483905,
    "timesteps": 665546694,
    "learntime": 0.2725219640415162,
    "sampletime": 8.721425607101992,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1884,
    "reward_mean": 9.762762658798085,
    "reward_max": 15.587217938225486,
    "reward_min": -12.691855926743296,
    "reward_std": 5.320464277102446,
    "timesteps": 665902740,
    "learntime": 0.26485726004466414,
    "sampletime": 8.830709664151073,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1885,
    "reward_mean": 11.874990041056895,
    "reward_max": 16.117102250837803,
    "reward_min": -2.7285545616113147,
    "reward_std": 3.837296053047529,
    "timesteps": 666261912,
    "learntime": 0.2629511822015047,
    "sampletime": 8.791440102038905,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1886,
    "reward_mean": 10.369201218001425,
    "reward_max": 15.70837448056166,
    "reward_min": -5.2248633594612,
    "reward_std": 4.57635955123276,
    "timesteps": 666620007,
    "learntime": 0.2645008768886328,
    "sampletime": 8.870921421097592,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1887,
    "reward_mean": 11.484447807107644,
    "reward_max": 15.71618866770895,
    "reward_min": 1.1841140735301736,
    "reward_std": 2.5565569777719537,
    "timesteps": 666979722,
    "learntime": 0.26978249195963144,
    "sampletime": 9.110841991845518,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1888,
    "reward_mean": 8.867812038179409,
    "reward_max": 15.841985089678523,
    "reward_min": -9.561591574936314,
    "reward_std": 4.830629722230312,
    "timesteps": 667334994,
    "learntime": 0.2646445098798722,
    "sampletime": 8.808255634037778,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1889,
    "reward_mean": 9.826123108322866,
    "reward_max": 14.177596579633907,
    "reward_min": 0.00041576090293479496,
    "reward_std": 3.085386854740151,
    "timesteps": 667693737,
    "learntime": 0.25987528706900775,
    "sampletime": 8.912468733964488,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1890,
    "reward_mean": 8.703603413687883,
    "reward_max": 13.445466560530338,
    "reward_min": -8.759659659337357,
    "reward_std": 3.3535949155983276,
    "timesteps": 668052123,
    "learntime": 0.26681857206858695,
    "sampletime": 8.840449061011896,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1891,
    "reward_mean": 8.97411856634436,
    "reward_max": 12.553492072616898,
    "reward_min": -0.5272934122829471,
    "reward_std": 2.7971998714562027,
    "timesteps": 668411562,
    "learntime": 0.2780419969931245,
    "sampletime": 8.921712666982785,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1892,
    "reward_mean": 9.666275345087165,
    "reward_max": 13.22436256055141,
    "reward_min": 6.244601919647362,
    "reward_std": 1.5715489037669406,
    "timesteps": 668772282,
    "learntime": 0.263952154899016,
    "sampletime": 8.671677395002916,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1893,
    "reward_mean": 6.806502043738111,
    "reward_max": 11.382357891790118,
    "reward_min": -7.287665359220807,
    "reward_std": 3.998236075446216,
    "timesteps": 669128529,
    "learntime": 0.2580641130916774,
    "sampletime": 8.862836430082098,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1894,
    "reward_mean": 7.822156836911759,
    "reward_max": 11.203603356792657,
    "reward_min": -8.657017872391874,
    "reward_std": 3.3341069757815838,
    "timesteps": 669487200,
    "learntime": 0.25974219711497426,
    "sampletime": 8.98415633616969,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1895,
    "reward_mean": 9.388040319973785,
    "reward_max": 14.2924041741838,
    "reward_min": 6.394607594122078,
    "reward_std": 1.4891692781174841,
    "timesteps": 669847920,
    "learntime": 0.26505269785411656,
    "sampletime": 8.871194361010566,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1896,
    "reward_mean": 7.117321854528076,
    "reward_max": 14.257439901823863,
    "reward_min": -18.20186072149822,
    "reward_std": 6.254992405264619,
    "timesteps": 670203342,
    "learntime": 0.26558953104540706,
    "sampletime": 8.952223521191627,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1897,
    "reward_mean": 8.374617819263097,
    "reward_max": 12.899127722387535,
    "reward_min": -9.71968994256476,
    "reward_std": 4.1629791875929865,
    "timesteps": 670560879,
    "learntime": 0.26704482710920274,
    "sampletime": 8.828940626000986,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1898,
    "reward_mean": 8.017217605363111,
    "reward_max": 12.3212066988115,
    "reward_min": -2.096939847450952,
    "reward_std": 3.39163063169094,
    "timesteps": 670919166,
    "learntime": 0.26453896099701524,
    "sampletime": 8.811254428932443,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1899,
    "reward_mean": 7.166847430457857,
    "reward_max": 12.319563284834713,
    "reward_min": -9.897577281605642,
    "reward_std": 4.434813181875189,
    "timesteps": 671275440,
    "learntime": 0.26107652904465795,
    "sampletime": 8.85576901002787,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1900,
    "reward_mean": 8.598302555787818,
    "reward_max": 12.62041573255688,
    "reward_min": -1.23488643014747,
    "reward_std": 3.2519359961174223,
    "timesteps": 671633814,
    "learntime": 0.27587022609077394,
    "sampletime": 8.93509484315291,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1901,
    "reward_mean": 9.006963597292092,
    "reward_max": 12.000561542315863,
    "reward_min": -0.4020403443701673,
    "reward_std": 2.3099245818052396,
    "timesteps": 671993547,
    "learntime": 0.26226049195975065,
    "sampletime": 9.00351445400156,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1902,
    "reward_mean": 9.18213785445871,
    "reward_max": 13.598569414904992,
    "reward_min": -1.0543640164427357,
    "reward_std": 3.851547470319756,
    "timesteps": 672350787,
    "learntime": 0.26588023896329105,
    "sampletime": 8.841204266063869,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1903,
    "reward_mean": 9.519623622803582,
    "reward_max": 12.765760472694332,
    "reward_min": -2.834253210965973,
    "reward_std": 2.6646688136323533,
    "timesteps": 672710487,
    "learntime": 0.2530052219517529,
    "sampletime": 8.936573883984238,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1904,
    "reward_mean": 10.31856105803454,
    "reward_max": 14.79286822128779,
    "reward_min": 7.309856337964337,
    "reward_std": 1.529497556183517,
    "timesteps": 673071207,
    "learntime": 0.25878254091367126,
    "sampletime": 9.031090554082766,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1905,
    "reward_mean": 10.311443568796424,
    "reward_max": 14.650020063064535,
    "reward_min": -15.709991873804645,
    "reward_std": 4.361535659346858,
    "timesteps": 673429587,
    "learntime": 0.2616854808293283,
    "sampletime": 8.944075790932402,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1906,
    "reward_mean": 9.595514515562543,
    "reward_max": 14.74060526392229,
    "reward_min": -0.49584178907345483,
    "reward_std": 4.168618609844233,
    "timesteps": 673784466,
    "learntime": 0.268604741897434,
    "sampletime": 8.732403710018843,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1907,
    "reward_mean": 10.946057478845365,
    "reward_max": 14.615142307405632,
    "reward_min": 1.6069889156175117,
    "reward_std": 3.2899088734257775,
    "timesteps": 674142750,
    "learntime": 0.25965518108569086,
    "sampletime": 8.896292241057381,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1908,
    "reward_mean": 11.280305213362192,
    "reward_max": 16.862310301699452,
    "reward_min": 1.9063332720543285,
    "reward_std": 3.8642534499998513,
    "timesteps": 674500062,
    "learntime": 0.2499531670473516,
    "sampletime": 8.957438607001677,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1909,
    "reward_mean": 10.099235090718059,
    "reward_max": 16.212983175343126,
    "reward_min": -7.4971145765404374,
    "reward_std": 6.02157782366755,
    "timesteps": 674854464,
    "learntime": 0.26153453695587814,
    "sampletime": 8.801830694079399,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1910,
    "reward_mean": 9.5434182011672,
    "reward_max": 16.494522675299475,
    "reward_min": -11.544161634632585,
    "reward_std": 6.371114024120305,
    "timesteps": 675210372,
    "learntime": 0.26576187391765416,
    "sampletime": 8.779460957972333,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1911,
    "reward_mean": 4.773700729806977,
    "reward_max": 17.191003672626913,
    "reward_min": -23.80052935189539,
    "reward_std": 10.490345359655995,
    "timesteps": 675556260,
    "learntime": 0.25907229306176305,
    "sampletime": 8.760045279050246,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1912,
    "reward_mean": 5.7493867536724395,
    "reward_max": 16.73395261790508,
    "reward_min": -28.528427779362673,
    "reward_std": 9.037185559059337,
    "timesteps": 675903690,
    "learntime": 0.2625177351292223,
    "sampletime": 8.688901244895533,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1913,
    "reward_mean": 3.1801518387055583,
    "reward_max": 17.067239784550935,
    "reward_min": -33.28839309024163,
    "reward_std": 11.655471586311993,
    "timesteps": 676246182,
    "learntime": 0.2928023349959403,
    "sampletime": 8.689210259122774,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1914,
    "reward_mean": -1.6756970782872735,
    "reward_max": 19.20245893331682,
    "reward_min": -33.22856371434208,
    "reward_std": 12.95361996393855,
    "timesteps": 676577961,
    "learntime": 0.2812948441132903,
    "sampletime": 8.40452244412154,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1915,
    "reward_mean": -1.8829287596378612,
    "reward_max": 17.29380201843962,
    "reward_min": -28.078082888619978,
    "reward_std": 11.713908034063053,
    "timesteps": 676911300,
    "learntime": 0.2685131800826639,
    "sampletime": 8.485559838125482,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1916,
    "reward_mean": -2.3500805671930536,
    "reward_max": 16.170181723297432,
    "reward_min": -53.33215136850733,
    "reward_std": 13.560250592996379,
    "timesteps": 677244078,
    "learntime": 0.26427960814908147,
    "sampletime": 8.41191035299562,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1917,
    "reward_mean": 4.394132489193305,
    "reward_max": 18.016873501269426,
    "reward_min": -28.770675591167272,
    "reward_std": 10.456320175067388,
    "timesteps": 677584800,
    "learntime": 0.26610611798241735,
    "sampletime": 8.683506755158305,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1918,
    "reward_mean": 0.45372590922137707,
    "reward_max": 17.586733459200435,
    "reward_min": -34.33303690237473,
    "reward_std": 12.616255003062477,
    "timesteps": 677920263,
    "learntime": 0.2618417290505022,
    "sampletime": 8.587631832109764,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1919,
    "reward_mean": 3.2586852724060504,
    "reward_max": 16.346670752672996,
    "reward_min": -41.88798325202626,
    "reward_std": 11.560387433832659,
    "timesteps": 678267354,
    "learntime": 0.26188322994858027,
    "sampletime": 8.685275926953182,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1920,
    "reward_mean": 6.459106153264228,
    "reward_max": 16.632230535078424,
    "reward_min": -24.188977307784658,
    "reward_std": 8.863338327069904,
    "timesteps": 678616374,
    "learntime": 0.2719175270758569,
    "sampletime": 8.729548861039802,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1921,
    "reward_mean": 9.103872368634988,
    "reward_max": 15.118881350991698,
    "reward_min": -12.802355902523477,
    "reward_std": 6.598720498702613,
    "timesteps": 678972282,
    "learntime": 0.2707858260255307,
    "sampletime": 8.793496391968802,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1922,
    "reward_mean": 11.121162455547637,
    "reward_max": 16.505129647315087,
    "reward_min": -7.154951613273528,
    "reward_std": 4.916821753805185,
    "timesteps": 679328793,
    "learntime": 0.26686019101180136,
    "sampletime": 8.936165446881205,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1923,
    "reward_mean": 12.039916335235038,
    "reward_max": 15.260012867136131,
    "reward_min": 1.7946656414335849,
    "reward_std": 2.384702522151208,
    "timesteps": 679688592,
    "learntime": 0.28626848198473454,
    "sampletime": 8.94036343600601,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1924,
    "reward_mean": 11.959171360583868,
    "reward_max": 14.145643718371332,
    "reward_min": 8.760211571585385,
    "reward_std": 1.1623028127547597,
    "timesteps": 680049312,
    "learntime": 0.2544694731477648,
    "sampletime": 8.935379215050489,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1925,
    "reward_mean": 11.257284159897813,
    "reward_max": 15.206319384319203,
    "reward_min": 0.37853496602143416,
    "reward_std": 2.2508374460038345,
    "timesteps": 680408796,
    "learntime": 0.27476408798247576,
    "sampletime": 8.896866142982617,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1926,
    "reward_mean": 11.09869606634348,
    "reward_max": 15.340684577364078,
    "reward_min": 7.979195426075332,
    "reward_std": 1.2344110356120692,
    "timesteps": 680769516,
    "learntime": 0.2719998541288078,
    "sampletime": 8.860035796184093,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1927,
    "reward_mean": 10.245363027095372,
    "reward_max": 13.145726478727404,
    "reward_min": 7.977708260098651,
    "reward_std": 1.085016528303436,
    "timesteps": 681130236,
    "learntime": 0.26369730313308537,
    "sampletime": 9.082895067986101,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1928,
    "reward_mean": 11.088628707488857,
    "reward_max": 13.249900341996126,
    "reward_min": 8.368168967151588,
    "reward_std": 1.0039856387398283,
    "timesteps": 681490956,
    "learntime": 0.2668221010826528,
    "sampletime": 9.071352193830535,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1929,
    "reward_mean": 9.884097205440277,
    "reward_max": 12.587354908703778,
    "reward_min": 0.29209643747890196,
    "reward_std": 2.4002520278526673,
    "timesteps": 681850512,
    "learntime": 0.27307050419040024,
    "sampletime": 8.924171312013641,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1930,
    "reward_mean": 10.608640841367137,
    "reward_max": 13.626993501019156,
    "reward_min": 8.841575124371568,
    "reward_std": 1.1103183188919883,
    "timesteps": 682211232,
    "learntime": 0.2818999388255179,
    "sampletime": 8.926635772921145,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1931,
    "reward_mean": 10.759816665195576,
    "reward_max": 13.671312532486445,
    "reward_min": 7.832470302212499,
    "reward_std": 1.2234207289596815,
    "timesteps": 682571952,
    "learntime": 0.2646801099181175,
    "sampletime": 9.043156069004908,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1932,
    "reward_mean": 9.45245349975104,
    "reward_max": 13.962699956186533,
    "reward_min": -7.8927375013290995,
    "reward_std": 4.473928613448042,
    "timesteps": 682930524,
    "learntime": 0.2689897718373686,
    "sampletime": 9.04353913012892,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1933,
    "reward_mean": 11.025913581682065,
    "reward_max": 13.821881584429788,
    "reward_min": 1.9621135240239553,
    "reward_std": 2.1779767517024915,
    "timesteps": 683290083,
    "learntime": 0.2650593281723559,
    "sampletime": 8.91515417699702,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1934,
    "reward_mean": 10.669348043896083,
    "reward_max": 14.359056588770313,
    "reward_min": -7.079042054557551,
    "reward_std": 3.5265986284652016,
    "timesteps": 683648400,
    "learntime": 0.27252136706374586,
    "sampletime": 8.966162608936429,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1935,
    "reward_mean": 10.976135459413879,
    "reward_max": 14.794214167434903,
    "reward_min": 2.1673721593785262,
    "reward_std": 2.7914377161562562,
    "timesteps": 684007044,
    "learntime": 0.2572334238793701,
    "sampletime": 9.082269056001678,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1936,
    "reward_mean": 12.60456108643891,
    "reward_max": 15.031470257014558,
    "reward_min": 10.412790814509869,
    "reward_std": 1.1492683411416886,
    "timesteps": 684367764,
    "learntime": 0.2654240701813251,
    "sampletime": 8.963144445093349,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1937,
    "reward_mean": 11.585493299726124,
    "reward_max": 15.755904807698569,
    "reward_min": 1.1679197831615544,
    "reward_std": 3.5456751315954986,
    "timesteps": 684725793,
    "learntime": 0.32392670889385045,
    "sampletime": 8.846425045048818,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1938,
    "reward_mean": 10.563917177702672,
    "reward_max": 16.26554147802138,
    "reward_min": -6.475236457779607,
    "reward_std": 5.217801699272797,
    "timesteps": 685084233,
    "learntime": 0.26281603099778295,
    "sampletime": 8.96792014199309,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1939,
    "reward_mean": 11.033812773490872,
    "reward_max": 16.388308989603754,
    "reward_min": -14.668772658674492,
    "reward_std": 5.957267494578433,
    "timesteps": 685441137,
    "learntime": 0.32477989699691534,
    "sampletime": 9.04222089285031,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1940,
    "reward_mean": 10.376574539762029,
    "reward_max": 17.316410040849757,
    "reward_min": -16.052376175486252,
    "reward_std": 7.478165963369855,
    "timesteps": 685798269,
    "learntime": 0.2774147598538548,
    "sampletime": 8.920850976137444,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1941,
    "reward_mean": 10.729822106135245,
    "reward_max": 16.61332596493417,
    "reward_min": -22.04507286817358,
    "reward_std": 6.789727619410243,
    "timesteps": 686153694,
    "learntime": 0.3242815379053354,
    "sampletime": 8.95370872109197,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1942,
    "reward_mean": 11.13214917809823,
    "reward_max": 19.06062825528065,
    "reward_min": -4.335771853073367,
    "reward_std": 5.5496723965301635,
    "timesteps": 686510733,
    "learntime": 0.26783418096601963,
    "sampletime": 9.010803111130372,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1943,
    "reward_mean": 3.2649296319178918,
    "reward_max": 18.825158454585388,
    "reward_min": -23.358564859679475,
    "reward_std": 10.436818449181105,
    "timesteps": 686860062,
    "learntime": 0.32472687982954085,
    "sampletime": 8.764989434042946,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1944,
    "reward_mean": 4.50441130973922,
    "reward_max": 19.338945219487258,
    "reward_min": -22.905657589125134,
    "reward_std": 10.455014648327271,
    "timesteps": 687214983,
    "learntime": 0.26772199501283467,
    "sampletime": 8.81541019002907,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1945,
    "reward_mean": 4.099574546791411,
    "reward_max": 19.367124495421493,
    "reward_min": -33.60938715881837,
    "reward_std": 11.488272895022025,
    "timesteps": 687568137,
    "learntime": 0.3172540180385113,
    "sampletime": 8.759266417007893,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1946,
    "reward_mean": 0.21295606729290273,
    "reward_max": 19.19747010601515,
    "reward_min": -37.04745941246317,
    "reward_std": 13.5487071434778,
    "timesteps": 687918522,
    "learntime": 0.2627405091188848,
    "sampletime": 8.790256894892082,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1947,
    "reward_mean": 1.9877005551656635,
    "reward_max": 19.300470619935144,
    "reward_min": -30.08262781778379,
    "reward_std": 10.530279417797772,
    "timesteps": 688263825,
    "learntime": 0.3259720280766487,
    "sampletime": 8.629266623174772,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1948,
    "reward_mean": 4.339610745006676,
    "reward_max": 19.425190208428024,
    "reward_min": -23.408477867725058,
    "reward_std": 10.786068667138887,
    "timesteps": 688614474,
    "learntime": 0.26055143401026726,
    "sampletime": 8.754435358103365,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1949,
    "reward_mean": -0.7307540340966141,
    "reward_max": 20.509012564878937,
    "reward_min": -22.633179412209298,
    "reward_std": 12.26836178485482,
    "timesteps": 688960074,
    "learntime": 0.3155944331083447,
    "sampletime": 8.809383700136095,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1950,
    "reward_mean": -2.0544261482288375,
    "reward_max": 18.937258153345308,
    "reward_min": -31.558608500020593,
    "reward_std": 13.21731620032848,
    "timesteps": 689304252,
    "learntime": 0.27379053202457726,
    "sampletime": 8.749702214961872,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1951,
    "reward_mean": 0.4124983430643193,
    "reward_max": 19.103577570212813,
    "reward_min": -29.57540830611039,
    "reward_std": 10.846560653126208,
    "timesteps": 689654586,
    "learntime": 0.3139630160294473,
    "sampletime": 8.74623625795357,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1952,
    "reward_mean": 2.092071725289784,
    "reward_max": 19.138175415744218,
    "reward_min": -40.75877026066001,
    "reward_std": 13.042515133613946,
    "timesteps": 690002505,
    "learntime": 0.2655518699903041,
    "sampletime": 8.62599076796323,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1953,
    "reward_mean": 1.9900947408970804,
    "reward_max": 19.14891799029923,
    "reward_min": -41.98985352384096,
    "reward_std": 11.915928626414791,
    "timesteps": 690353547,
    "learntime": 0.3124927810858935,
    "sampletime": 8.98035497800447,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1954,
    "reward_mean": -2.633862263824419,
    "reward_max": 18.63773128082495,
    "reward_min": -42.93411330417307,
    "reward_std": 14.02330312696553,
    "timesteps": 690699654,
    "learntime": 0.2643941598944366,
    "sampletime": 8.759914666879922,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1955,
    "reward_mean": -2.137760208082705,
    "reward_max": 19.063446769891822,
    "reward_min": -29.610336193983766,
    "reward_std": 12.412212121753937,
    "timesteps": 691048323,
    "learntime": 0.32742865406908095,
    "sampletime": 8.7447735669557,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1956,
    "reward_mean": 4.495728923301835,
    "reward_max": 18.256526455175564,
    "reward_min": -21.54742944420485,
    "reward_std": 10.43896763232337,
    "timesteps": 691403250,
    "learntime": 0.26706261397339404,
    "sampletime": 8.854105073027313,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1957,
    "reward_mean": 3.9923754972412118,
    "reward_max": 18.55813764283349,
    "reward_min": -28.695502688315884,
    "reward_std": 11.669831460230697,
    "timesteps": 691757148,
    "learntime": 0.32889310899190605,
    "sampletime": 8.946752620860934,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1958,
    "reward_mean": 8.751338697544622,
    "reward_max": 18.97748401737772,
    "reward_min": -20.031598775733276,
    "reward_std": 8.794148378122618,
    "timesteps": 692114058,
    "learntime": 0.27459065010771155,
    "sampletime": 8.900467045139521,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1959,
    "reward_mean": 9.58942095029737,
    "reward_max": 18.00332617718694,
    "reward_min": -13.259848841047859,
    "reward_std": 7.960800304649251,
    "timesteps": 692468409,
    "learntime": 0.31838890304788947,
    "sampletime": 8.873604667838663,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1960,
    "reward_mean": 10.449493620332042,
    "reward_max": 18.140094109448697,
    "reward_min": -5.907188032429215,
    "reward_std": 7.245925092862046,
    "timesteps": 692824281,
    "learntime": 0.2692757558543235,
    "sampletime": 9.12678014091216,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1961,
    "reward_mean": 10.432425388655869,
    "reward_max": 17.05177071112187,
    "reward_min": -4.771742136244106,
    "reward_std": 5.928298169939733,
    "timesteps": 693179277,
    "learntime": 0.3157723050098866,
    "sampletime": 8.972904955036938,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1962,
    "reward_mean": 11.302891763286402,
    "reward_max": 17.099221853186574,
    "reward_min": -17.560311922648303,
    "reward_std": 6.01727246280528,
    "timesteps": 693533520,
    "learntime": 0.2718235841020942,
    "sampletime": 8.928693035850301,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1963,
    "reward_mean": 11.870031626158362,
    "reward_max": 16.36305256690265,
    "reward_min": -4.792468085616949,
    "reward_std": 4.767522711232847,
    "timesteps": 693890298,
    "learntime": 0.3211387430783361,
    "sampletime": 8.911873318022117,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1964,
    "reward_mean": 7.478999622101308,
    "reward_max": 15.710397964865534,
    "reward_min": -7.230601023699188,
    "reward_std": 7.039925826954416,
    "timesteps": 694239399,
    "learntime": 0.26297588599845767,
    "sampletime": 8.807107285130769,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1965,
    "reward_mean": 10.402721520558195,
    "reward_max": 15.81433187037967,
    "reward_min": -7.778449793572003,
    "reward_std": 5.626166311776512,
    "timesteps": 694593438,
    "learntime": 0.26668298803269863,
    "sampletime": 8.796095608035102,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1966,
    "reward_mean": 11.390163499575788,
    "reward_max": 15.611512729601763,
    "reward_min": -7.3821113258988325,
    "reward_std": 4.484453882275838,
    "timesteps": 694949988,
    "learntime": 0.27178124990314245,
    "sampletime": 8.91462956694886,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1967,
    "reward_mean": 10.085055411065088,
    "reward_max": 15.28072393742287,
    "reward_min": -6.934044239661582,
    "reward_std": 4.774299378356349,
    "timesteps": 695305047,
    "learntime": 0.2617876010481268,
    "sampletime": 8.96866778912954,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1968,
    "reward_mean": 9.947953351951217,
    "reward_max": 14.77940687251329,
    "reward_min": -8.138389005071737,
    "reward_std": 4.9591083232398,
    "timesteps": 695660355,
    "learntime": 0.301792104030028,
    "sampletime": 8.885511549888179,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1969,
    "reward_mean": 8.029669978767352,
    "reward_max": 13.828309490874581,
    "reward_min": -16.976811516048407,
    "reward_std": 6.113085861005013,
    "timesteps": 696013491,
    "learntime": 0.26290700607933104,
    "sampletime": 8.821779103018343,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1970,
    "reward_mean": 9.968079525151259,
    "reward_max": 14.50002834392635,
    "reward_min": -9.080532556731312,
    "reward_std": 4.5034704345231,
    "timesteps": 696369858,
    "learntime": 0.3114573219791055,
    "sampletime": 8.918144804891199,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1971,
    "reward_mean": 9.686873949979127,
    "reward_max": 13.19509364323863,
    "reward_min": -8.772140348983212,
    "reward_std": 4.162093246759614,
    "timesteps": 696727470,
    "learntime": 0.2713594960514456,
    "sampletime": 8.91557454993017,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1972,
    "reward_mean": 7.885233012481317,
    "reward_max": 11.996332794836865,
    "reward_min": -9.325379063848011,
    "reward_std": 4.853816487045278,
    "timesteps": 697083120,
    "learntime": 0.3091444841120392,
    "sampletime": 8.88641595817171,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1973,
    "reward_mean": 7.512105118536777,
    "reward_max": 12.274321972919893,
    "reward_min": -9.159536639997514,
    "reward_std": 5.603575381836538,
    "timesteps": 697436466,
    "learntime": 0.2691381280310452,
    "sampletime": 8.82128537283279,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1974,
    "reward_mean": 7.133901090514522,
    "reward_max": 12.125364237182744,
    "reward_min": -17.51974598883306,
    "reward_std": 5.552888363311777,
    "timesteps": 697790181,
    "learntime": 0.33705627592280507,
    "sampletime": 8.964817652013153,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1975,
    "reward_mean": 9.158815622947843,
    "reward_max": 12.340142335831786,
    "reward_min": -9.399253208528867,
    "reward_std": 3.3410004970509513,
    "timesteps": 698148852,
    "learntime": 0.27717498899437487,
    "sampletime": 8.991889101918787,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1976,
    "reward_mean": 9.15076409566329,
    "reward_max": 11.973287974167356,
    "reward_min": -0.35316129161786,
    "reward_std": 2.973855952806069,
    "timesteps": 698507985,
    "learntime": 0.29149450408294797,
    "sampletime": 8.938324197893962,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1977,
    "reward_mean": 8.213060502184655,
    "reward_max": 11.437182445266059,
    "reward_min": -11.073869054346828,
    "reward_std": 3.860992559857419,
    "timesteps": 698865450,
    "learntime": 0.2678839189466089,
    "sampletime": 8.894425776787102,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1978,
    "reward_mean": 7.813028211011578,
    "reward_max": 11.866830973547291,
    "reward_min": -7.102717634939563,
    "reward_std": 4.162275727905757,
    "timesteps": 699221046,
    "learntime": 0.29993986315093935,
    "sampletime": 8.92495142784901,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1979,
    "reward_mean": 7.737073745022018,
    "reward_max": 11.605438594615405,
    "reward_min": -9.694914238735551,
    "reward_std": 4.243801831136299,
    "timesteps": 699577689,
    "learntime": 0.2640355278272182,
    "sampletime": 8.970303046982735,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1980,
    "reward_mean": 7.672466735634299,
    "reward_max": 11.872006924863348,
    "reward_min": -9.247510356175944,
    "reward_std": 4.283370095722912,
    "timesteps": 699935001,
    "learntime": 0.3314516548998654,
    "sampletime": 8.79274547402747,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1981,
    "reward_mean": 8.826247359579124,
    "reward_max": 11.466667948497077,
    "reward_min": -1.0424624864280148,
    "reward_std": 2.2690260690849,
    "timesteps": 700294746,
    "learntime": 0.2647762300912291,
    "sampletime": 8.969026102917269,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1982,
    "reward_mean": 7.260024728481333,
    "reward_max": 12.23194406489104,
    "reward_min": -19.259057058871615,
    "reward_std": 5.256497957365767,
    "timesteps": 700649958,
    "learntime": 0.34211699292063713,
    "sampletime": 8.889278857037425,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1983,
    "reward_mean": 7.2295294258822524,
    "reward_max": 11.680804302767177,
    "reward_min": -7.859102446841263,
    "reward_std": 4.408933713709129,
    "timesteps": 701005494,
    "learntime": 0.2714248748961836,
    "sampletime": 8.857444510096684,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1984,
    "reward_mean": 6.016785467045454,
    "reward_max": 10.85687081508028,
    "reward_min": -9.850215892473265,
    "reward_std": 5.4880544334931525,
    "timesteps": 701357448,
    "learntime": 0.316067298874259,
    "sampletime": 8.911313895136118,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1985,
    "reward_mean": 4.870918823003105,
    "reward_max": 12.310124868244834,
    "reward_min": -17.49436799248162,
    "reward_std": 7.0390304437965305,
    "timesteps": 701706549,
    "learntime": 0.2830290438141674,
    "sampletime": 8.774065941106528,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1986,
    "reward_mean": 3.598209571154172,
    "reward_max": 11.097448506745309,
    "reward_min": -20.186021640134808,
    "reward_std": 8.224404475667214,
    "timesteps": 702052935,
    "learntime": 0.3292869001161307,
    "sampletime": 8.629088422982022,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1987,
    "reward_mean": 1.9902314159000665,
    "reward_max": 11.974883906892495,
    "reward_min": -19.13258680850832,
    "reward_std": 8.030682815981631,
    "timesteps": 702394017,
    "learntime": 0.26827691006474197,
    "sampletime": 8.663096746895462,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1988,
    "reward_mean": 0.2554047548713003,
    "reward_max": 10.73639071181727,
    "reward_min": -28.49268535637847,
    "reward_std": 8.908155255199018,
    "timesteps": 702731931,
    "learntime": 0.27175264712423086,
    "sampletime": 8.70655224705115,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1989,
    "reward_mean": 0.49953475678519865,
    "reward_max": 11.299195270858363,
    "reward_min": -25.65800029815485,
    "reward_std": 9.340107899476187,
    "timesteps": 703070184,
    "learntime": 0.3226788491010666,
    "sampletime": 8.553148926002905,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1990,
    "reward_mean": -0.6689107034172093,
    "reward_max": 10.843926791110512,
    "reward_min": -38.985607516786054,
    "reward_std": 10.595826842123946,
    "timesteps": 703406286,
    "learntime": 0.2715817391872406,
    "sampletime": 8.539516645949334,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1991,
    "reward_mean": -6.742107324703734,
    "reward_max": 9.830978351813327,
    "reward_min": -29.01127363863458,
    "reward_std": 10.337165570442268,
    "timesteps": 703727820,
    "learntime": 0.3083879789337516,
    "sampletime": 8.378781438106671,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1992,
    "reward_mean": -2.8843474202388757,
    "reward_max": 10.595238588174752,
    "reward_min": -29.112788506659637,
    "reward_std": 9.780710403025395,
    "timesteps": 704059221,
    "learntime": 0.28115400997921824,
    "sampletime": 8.541560858022422,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1993,
    "reward_mean": -4.851244722631211,
    "reward_max": 10.825623876754296,
    "reward_min": -34.201552751281675,
    "reward_std": 10.057958531063816,
    "timesteps": 704385723,
    "learntime": 0.32342161796987057,
    "sampletime": 8.487547661876306,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1994,
    "reward_mean": -0.8641428360948664,
    "reward_max": 10.617198862983829,
    "reward_min": -20.724783518415123,
    "reward_std": 8.91783788646787,
    "timesteps": 704721357,
    "learntime": 0.2751511230599135,
    "sampletime": 8.507129394914955,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1995,
    "reward_mean": -5.877598008587838,
    "reward_max": 9.900365022533206,
    "reward_min": -30.14630947260638,
    "reward_std": 10.959808707158855,
    "timesteps": 705044565,
    "learntime": 0.3310164080467075,
    "sampletime": 8.367832609917969,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1996,
    "reward_mean": -6.990685141366248,
    "reward_max": 9.510411357882221,
    "reward_min": -30.22415097026775,
    "reward_std": 9.066444693065332,
    "timesteps": 705365052,
    "learntime": 0.30683372798375785,
    "sampletime": 8.326038283063099,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1997,
    "reward_mean": -5.047280311008613,
    "reward_max": 9.781154954319138,
    "reward_min": -34.97949625023305,
    "reward_std": 9.92526415049628,
    "timesteps": 705690930,
    "learntime": 0.2669767700135708,
    "sampletime": 8.643602344207466,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1998,
    "reward_mean": -2.474302610884573,
    "reward_max": 9.959248052042144,
    "reward_min": -38.40947592875984,
    "reward_std": 9.95469357030993,
    "timesteps": 706023540,
    "learntime": 0.26313459617085755,
    "sampletime": 8.472705831052735,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 1999,
    "reward_mean": -6.919110844739328,
    "reward_max": 9.16515444298986,
    "reward_min": -43.80634301398337,
    "reward_std": 11.011386627334128,
    "timesteps": 706345368,
    "learntime": 0.2661049028392881,
    "sampletime": 8.238932015839964,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  },
  {
    "gen": 2000,
    "reward_mean": -0.767518679041051,
    "reward_max": 8.856969290356517,
    "reward_min": -30.55159458102902,
    "reward_std": 9.282095401444035,
    "timesteps": 706683864,
    "learntime": 0.32562894909642637,
    "sampletime": 8.547876436030492,
    "best_max_mean": 13.642681692213058,
    "best_max": 25.03806481092599
  }
]