[
  {
    "gen": 1,
    "reward_mean": -102.38994204638064,
    "reward_max": -85.78293815424496,
    "reward_min": -107.7362176503591,
    "reward_std": 5.336278943221367,
    "timesteps": 46131,
    "learntime": 0.6521104341372848,
    "sampletime": 1.7745423871092498,
    "best_max_mean": -102.38994204638064,
    "best_max": -85.78293815424496
  },
  {
    "gen": 2,
    "reward_mean": -98.87746771859105,
    "reward_max": -75.0038542570264,
    "reward_min": -106.92669570522213,
    "reward_std": 8.38043333365588,
    "timesteps": 104445,
    "learntime": 0.19226706912741065,
    "sampletime": 2.0712825539521873,
    "best_max_mean": -98.87746771859105,
    "best_max": -75.0038542570264
  },
  {
    "gen": 3,
    "reward_mean": -99.60057819517064,
    "reward_max": -71.27210509140019,
    "reward_min": -106.92210351345551,
    "reward_std": 9.034415528427255,
    "timesteps": 159534,
    "learntime": 0.1297527130227536,
    "sampletime": 2.179037116933614,
    "best_max_mean": -99.60057819517064,
    "best_max": -71.27210509140019
  },
  {
    "gen": 4,
    "reward_mean": -101.2176601159924,
    "reward_max": -65.16843225533904,
    "reward_min": -106.61777130632915,
    "reward_std": 7.486637971714725,
    "timesteps": 206073,
    "learntime": 0.1314756809733808,
    "sampletime": 1.4934538789093494,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 5,
    "reward_mean": -101.65495703856585,
    "reward_max": -75.96398201533663,
    "reward_min": -107.27555255541068,
    "reward_std": 6.530488234217195,
    "timesteps": 255372,
    "learntime": 0.17158709093928337,
    "sampletime": 2.0291690649464726,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 6,
    "reward_mean": -98.9521998237791,
    "reward_max": -71.26730342517192,
    "reward_min": -107.7080989997326,
    "reward_std": 8.500026275739765,
    "timesteps": 308571,
    "learntime": 0.11807736800983548,
    "sampletime": 1.9996238711755723,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 7,
    "reward_mean": -99.58582380323205,
    "reward_max": -65.48651768971291,
    "reward_min": -106.89405201994425,
    "reward_std": 9.017732430561066,
    "timesteps": 364761,
    "learntime": 0.1757079961244017,
    "sampletime": 2.1340599621180445,
    "best_max_mean": -101.2176601159924,
    "best_max": -65.16843225533904
  },
  {
    "gen": 8,
    "reward_mean": -97.0277302524768,
    "reward_max": -64.06369167835113,
    "reward_min": -107.77877366666993,
    "reward_std": 9.456374919132495,
    "timesteps": 430275,
    "learntime": 0.14844789006747305,
    "sampletime": 2.717060575960204,
    "best_max_mean": -97.0277302524768,
    "best_max": -64.06369167835113
  },
  {
    "gen": 9,
    "reward_mean": -88.93528089997315,
    "reward_max": -48.41550483739454,
    "reward_min": -106.00306195074296,
    "reward_std": 16.15328314281969,
    "timesteps": 517482,
    "learntime": 0.17656322289258242,
    "sampletime": 3.077022103825584,
    "best_max_mean": -88.93528089997315,
    "best_max": -48.41550483739454
  },
  {
    "gen": 10,
    "reward_mean": -97.7850168084176,
    "reward_max": -56.13470308608234,
    "reward_min": -106.9795834791254,
    "reward_std": 10.297551833955657,
    "timesteps": 573873,
    "learntime": 0.12921444000676274,
    "sampletime": 2.5741116949357092,
    "best_max_mean": -88.93528089997315,
    "best_max": -48.41550483739454
  },
  {
    "gen": 11,
    "reward_mean": -87.2773422771794,
    "reward_max": -57.79720460939589,
    "reward_min": -105.9365183078176,
    "reward_std": 14.769305267636927,
    "timesteps": 664392,
    "learntime": 0.1714509129524231,
    "sampletime": 3.371495700906962,
    "best_max_mean": -88.93528089997315,
    "best_max": -48.41550483739454
  },
  {
    "gen": 12,
    "reward_mean": -80.42094375647807,
    "reward_max": -27.60276943081144,
    "reward_min": -105.6781937026447,
    "reward_std": 17.863412825985527,
    "timesteps": 781977,
    "learntime": 0.11230825399979949,
    "sampletime": 3.696625357028097,
    "best_max_mean": -80.42094375647807,
    "best_max": -27.60276943081144
  },
  {
    "gen": 13,
    "reward_mean": -87.72489389132404,
    "reward_max": -35.7486622160597,
    "reward_min": -104.72366602052676,
    "reward_std": 13.737252647383496,
    "timesteps": 867792,
    "learntime": 0.1876778700388968,
    "sampletime": 2.768368168035522,
    "best_max_mean": -80.42094375647807,
    "best_max": -27.60276943081144
  },
  {
    "gen": 14,
    "reward_mean": -73.09934387798369,
    "reward_max": -27.192279244222764,
    "reward_min": -105.81903668852861,
    "reward_std": 20.82300250068368,
    "timesteps": 996285,
    "learntime": 0.11485506989993155,
    "sampletime": 4.792063041822985,
    "best_max_mean": -73.09934387798369,
    "best_max": -27.192279244222764
  },
  {
    "gen": 15,
    "reward_mean": -70.19649255630549,
    "reward_max": 2.038026873036428,
    "reward_min": -104.54970959123847,
    "reward_std": 19.696779954194778,
    "timesteps": 1135209,
    "learntime": 0.17028308706358075,
    "sampletime": 4.675073759863153,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 16,
    "reward_mean": -66.28953162540066,
    "reward_max": -25.654304838221936,
    "reward_min": -105.06073446698825,
    "reward_std": 20.763560450475904,
    "timesteps": 1287507,
    "learntime": 0.13079651212319732,
    "sampletime": 4.758382737170905,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 17,
    "reward_mean": -56.46292248290599,
    "reward_max": -26.285616007435955,
    "reward_min": -103.94754674692045,
    "reward_std": 17.527737724338785,
    "timesteps": 1469853,
    "learntime": 0.168558144941926,
    "sampletime": 6.030570604838431,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 18,
    "reward_mean": -56.65340986580772,
    "reward_max": -18.630662049166858,
    "reward_min": -103.84975305801454,
    "reward_std": 17.12917695506961,
    "timesteps": 1652412,
    "learntime": 0.1461617909371853,
    "sampletime": 4.918839840916917,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 19,
    "reward_mean": -64.27318182043786,
    "reward_max": -27.532143769630547,
    "reward_min": -104.19052099531065,
    "reward_std": 19.30834453749585,
    "timesteps": 1813989,
    "learntime": 0.16120150685310364,
    "sampletime": 5.03311446798034,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 20,
    "reward_mean": -53.88590894887239,
    "reward_max": -9.949309100312266,
    "reward_min": -93.97195758591548,
    "reward_std": 18.801988237921837,
    "timesteps": 2004750,
    "learntime": 0.13689217693172395,
    "sampletime": 5.756852702004835,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 21,
    "reward_mean": -54.67908825287088,
    "reward_max": -27.73553565392892,
    "reward_min": -94.60309190953603,
    "reward_std": 15.1277704887685,
    "timesteps": 2192406,
    "learntime": 0.15812106593512,
    "sampletime": 6.461125765927136,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 22,
    "reward_mean": -56.214122348593875,
    "reward_max": -10.258356088828863,
    "reward_min": -95.07827982012972,
    "reward_std": 16.883999753068835,
    "timesteps": 2376036,
    "learntime": 0.12767783901654184,
    "sampletime": 5.778592320159078,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 23,
    "reward_mean": -49.97193416491082,
    "reward_max": -7.984028022736311,
    "reward_min": -104.40096804536316,
    "reward_std": 19.567580376681533,
    "timesteps": 2578344,
    "learntime": 0.1580877429805696,
    "sampletime": 5.371665463084355,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 24,
    "reward_mean": -45.973636347988695,
    "reward_max": 0.8685248612309789,
    "reward_min": -85.73624557396397,
    "reward_std": 19.198646745120275,
    "timesteps": 2794860,
    "learntime": 0.12024719198234379,
    "sampletime": 6.141410492127761,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 25,
    "reward_mean": -39.502262391974895,
    "reward_max": -8.971229608706906,
    "reward_min": -76.17843568526828,
    "reward_std": 14.273361391918257,
    "timesteps": 3029601,
    "learntime": 0.16682030400261283,
    "sampletime": 6.385622612899169,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 26,
    "reward_mean": -35.38652359541666,
    "reward_max": 0.5135713027028174,
    "reward_min": -78.52739012406933,
    "reward_std": 17.687544327027673,
    "timesteps": 3278337,
    "learntime": 0.11845576390624046,
    "sampletime": 6.693728982936591,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 27,
    "reward_mean": -44.449549833335716,
    "reward_max": -17.82874547238603,
    "reward_min": -76.04549739938794,
    "reward_std": 14.421309428354922,
    "timesteps": 3500604,
    "learntime": 0.1797730380203575,
    "sampletime": 6.507128495024517,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 28,
    "reward_mean": -47.40337869372617,
    "reward_max": -8.213795739395374,
    "reward_min": -84.98092117191602,
    "reward_std": 19.261669578666485,
    "timesteps": 3710733,
    "learntime": 0.11464813607744873,
    "sampletime": 6.1374259339645505,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 29,
    "reward_mean": -52.374007311149555,
    "reward_max": -8.547987124315556,
    "reward_min": -94.73693626404346,
    "reward_std": 19.542515636150597,
    "timesteps": 3905619,
    "learntime": 0.1767527109477669,
    "sampletime": 5.608256534207612,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 30,
    "reward_mean": -47.844439884452626,
    "reward_max": -17.99338314646968,
    "reward_min": -84.93164482170886,
    "reward_std": 17.108700055893063,
    "timesteps": 4116171,
    "learntime": 0.12079937802627683,
    "sampletime": 6.205006408970803,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 31,
    "reward_mean": -39.17696359531341,
    "reward_max": -7.5873968389609665,
    "reward_min": -104.33252508345653,
    "reward_std": 19.74578112019199,
    "timesteps": 4352808,
    "learntime": 0.16962169692851603,
    "sampletime": 6.612141807097942,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 32,
    "reward_mean": -40.41490456587953,
    "reward_max": 0.6760913394953734,
    "reward_min": -83.8787130974233,
    "reward_std": 19.05939557977212,
    "timesteps": 4584423,
    "learntime": 0.11335350200533867,
    "sampletime": 6.2906988330651075,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 33,
    "reward_mean": -33.52666722504095,
    "reward_max": -0.14811956309454946,
    "reward_min": -65.86744315419911,
    "reward_std": 15.99516201653817,
    "timesteps": 4838892,
    "learntime": 0.1652961759828031,
    "sampletime": 6.645601129159331,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 34,
    "reward_mean": -37.0108426661061,
    "reward_max": 0.3414849525098816,
    "reward_min": -75.99715627461786,
    "reward_std": 18.140635641991107,
    "timesteps": 5082918,
    "learntime": 0.1327598369680345,
    "sampletime": 6.7461068069096655,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 35,
    "reward_mean": -31.673934213079093,
    "reward_max": 0.29029221236917063,
    "reward_min": -101.35318438858359,
    "reward_std": 18.25740566354652,
    "timesteps": 5342892,
    "learntime": 0.17409130581654608,
    "sampletime": 7.216084808809683,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 36,
    "reward_mean": -20.596387028474382,
    "reward_max": 1.4338661646549762,
    "reward_min": -51.81269219430221,
    "reward_std": 13.067138984481996,
    "timesteps": 5638923,
    "learntime": 0.1148284140508622,
    "sampletime": 7.630363221978769,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 37,
    "reward_mean": -29.4752695795391,
    "reward_max": 1.1517201887415423,
    "reward_min": -76.38338478639099,
    "reward_std": 18.64440255799288,
    "timesteps": 5904915,
    "learntime": 0.165883578825742,
    "sampletime": 7.167952107032761,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 38,
    "reward_mean": -25.287716592062573,
    "reward_max": 1.2231071980667423,
    "reward_min": -65.99550244607256,
    "reward_std": 16.044298556242726,
    "timesteps": 6190716,
    "learntime": 0.12406880990602076,
    "sampletime": 7.373939337907359,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 39,
    "reward_mean": -11.596995678121061,
    "reward_max": 1.4222444697645376,
    "reward_min": -57.78689074206914,
    "reward_std": 10.974404566484257,
    "timesteps": 6516369,
    "learntime": 0.1665782150812447,
    "sampletime": 8.125510447891429,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 40,
    "reward_mean": -20.72170670758458,
    "reward_max": 0.8905043049440272,
    "reward_min": -75.39002646708326,
    "reward_std": 14.516262079433536,
    "timesteps": 6814203,
    "learntime": 0.12002840591594577,
    "sampletime": 7.629504435928538,
    "best_max_mean": -70.19649255630549,
    "best_max": 2.038026873036428
  },
  {
    "gen": 41,
    "reward_mean": -10.651242528363127,
    "reward_max": 2.0419432839419924,
    "reward_min": -49.725032747283365,
    "reward_std": 11.753708216688016,
    "timesteps": 7145211,
    "learntime": 0.18074694089591503,
    "sampletime": 8.047699023038149,
    "best_max_mean": -10.651242528363127,
    "best_max": 2.0419432839419924
  },
  {
    "gen": 42,
    "reward_mean": -4.181951147291855,
    "reward_max": 2.2129296977331627,
    "reward_min": -27.09957153613725,
    "reward_std": 6.997478891260294,
    "timesteps": 7492026,
    "learntime": 0.1276325359940529,
    "sampletime": 8.288728979881853,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 43,
    "reward_mean": -3.8453899021074465,
    "reward_max": 2.0899661730307098,
    "reward_min": -26.780295251163114,
    "reward_std": 6.60951742207531,
    "timesteps": 7839249,
    "learntime": 0.1653220800217241,
    "sampletime": 8.423587512923405,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 44,
    "reward_mean": -2.95656072162115,
    "reward_max": 2.127227258764445,
    "reward_min": -47.55577632858927,
    "reward_std": 8.05084569620544,
    "timesteps": 8189109,
    "learntime": 0.11141704116016626,
    "sampletime": 8.410569183062762,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 45,
    "reward_mean": -1.1586074313807209,
    "reward_max": 2.0507708590610254,
    "reward_min": -17.769815113776446,
    "reward_std": 4.396912618060163,
    "timesteps": 8543046,
    "learntime": 0.16682794014923275,
    "sampletime": 8.452907832106575,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 46,
    "reward_mean": 0.8758083467020369,
    "reward_max": 2.0418922907362367,
    "reward_min": -17.2220408182563,
    "reward_std": 2.5729674644354414,
    "timesteps": 8902713,
    "learntime": 0.12256750604137778,
    "sampletime": 8.506605970906094,
    "best_max_mean": -4.181951147291855,
    "best_max": 2.2129296977331627
  },
  {
    "gen": 47,
    "reward_mean": -2.165411959787625,
    "reward_max": 2.2421953672036925,
    "reward_min": -34.71552958687729,
    "reward_std": 6.939037190707742,
    "timesteps": 9254568,
    "learntime": 0.166214345023036,
    "sampletime": 8.400415963958949,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 48,
    "reward_mean": 1.474219021535204,
    "reward_max": 2.1087811529933873,
    "reward_min": 0.03495460979885825,
    "reward_std": 0.30848162974336935,
    "timesteps": 9615288,
    "learntime": 0.12544223805889487,
    "sampletime": 8.612950601847842,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 49,
    "reward_mean": 1.1228624132698484,
    "reward_max": 2.065879017859007,
    "reward_min": -8.419802303835628,
    "reward_std": 1.997494343207942,
    "timesteps": 9974748,
    "learntime": 0.1980799320153892,
    "sampletime": 8.517408717190847,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 50,
    "reward_mean": -0.4769958233704735,
    "reward_max": 1.9337291791012026,
    "reward_min": -22.70244519318739,
    "reward_std": 4.728403407859763,
    "timesteps": 10331505,
    "learntime": 0.12700117682106793,
    "sampletime": 8.476811971049756,
    "best_max_mean": -2.165411959787625,
    "best_max": 2.2421953672036925
  },
  {
    "gen": 51,
    "reward_mean": 1.235418092813611,
    "reward_max": 2.2578653277843377,
    "reward_min": -9.383352967367198,
    "reward_std": 2.139425968504328,
    "timesteps": 10690977,
    "learntime": 0.1779136119876057,
    "sampletime": 8.494561285944656,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 52,
    "reward_mean": 1.06584610330267,
    "reward_max": 2.20397818291729,
    "reward_min": -7.747818761258248,
    "reward_std": 1.928172385264683,
    "timesteps": 11051067,
    "learntime": 0.1284502102062106,
    "sampletime": 8.532853039214388,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 53,
    "reward_mean": 0.9758177601469334,
    "reward_max": 2.205417457982106,
    "reward_min": -7.497108487066617,
    "reward_std": 2.6355445262342925,
    "timesteps": 11409255,
    "learntime": 0.17148346593603492,
    "sampletime": 8.448904996970668,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 54,
    "reward_mean": 0.9977810815060011,
    "reward_max": 2.140227806091195,
    "reward_min": -16.233687034666108,
    "reward_std": 3.356812948335024,
    "timesteps": 11767578,
    "learntime": 0.115964625030756,
    "sampletime": 8.544124722015113,
    "best_max_mean": 1.235418092813611,
    "best_max": 2.2578653277843377
  },
  {
    "gen": 55,
    "reward_mean": 1.6057211638531097,
    "reward_max": 2.4207475148864543,
    "reward_min": -3.7977498569067207,
    "reward_std": 0.8803230362857044,
    "timesteps": 12128298,
    "learntime": 0.16656083497218788,
    "sampletime": 8.546651341952384,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 56,
    "reward_mean": 1.3496704086576812,
    "reward_max": 2.2051075713349166,
    "reward_min": -7.090324603982566,
    "reward_std": 1.8662554718612063,
    "timesteps": 12487875,
    "learntime": 0.13360372395254672,
    "sampletime": 8.542620355961844,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 57,
    "reward_mean": 1.8394492048340176,
    "reward_max": 2.283127114550687,
    "reward_min": 1.5234195190220774,
    "reward_std": 0.15553942276844981,
    "timesteps": 12848595,
    "learntime": 0.18163597490638494,
    "sampletime": 8.584283116972074,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 58,
    "reward_mean": 1.064805427801108,
    "reward_max": 2.252194483041282,
    "reward_min": -13.942375453885896,
    "reward_std": 2.863474234895718,
    "timesteps": 13206867,
    "learntime": 0.12345976894721389,
    "sampletime": 8.49074229807593,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 59,
    "reward_mean": 1.8398472224200517,
    "reward_max": 2.081085004746757,
    "reward_min": 1.5025827772421452,
    "reward_std": 0.126632512833579,
    "timesteps": 13567587,
    "learntime": 0.17769214301370084,
    "sampletime": 8.513964754063636,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 60,
    "reward_mean": 1.8379090197514878,
    "reward_max": 2.083551095486844,
    "reward_min": 1.539532783355549,
    "reward_std": 0.1295365428720181,
    "timesteps": 13928307,
    "learntime": 0.11551481718197465,
    "sampletime": 8.614011953119189,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 61,
    "reward_mean": 1.8196659655521907,
    "reward_max": 2.114109133888355,
    "reward_min": 1.5542171989765097,
    "reward_std": 0.1267809965767768,
    "timesteps": 14289027,
    "learntime": 0.1729039230849594,
    "sampletime": 8.557736401911825,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 62,
    "reward_mean": 1.373646314579484,
    "reward_max": 2.100014968201952,
    "reward_min": -7.289584486533636,
    "reward_std": 1.8464151240742732,
    "timesteps": 14648697,
    "learntime": 0.11671559396199882,
    "sampletime": 8.599367182934657,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 63,
    "reward_mean": 1.833711796656752,
    "reward_max": 2.1358767444387774,
    "reward_min": 1.4592537950520625,
    "reward_std": 0.15214980310383008,
    "timesteps": 15009417,
    "learntime": 0.16845654416829348,
    "sampletime": 8.618467933032662,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 64,
    "reward_mean": 1.4101507352344262,
    "reward_max": 2.1684154354134604,
    "reward_min": -15.54409994794917,
    "reward_std": 2.3912561896743174,
    "timesteps": 15368985,
    "learntime": 0.11648368602618575,
    "sampletime": 8.558193278964609,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 65,
    "reward_mean": 1.340498472521806,
    "reward_max": 2.0701214816261864,
    "reward_min": -7.711417927551367,
    "reward_std": 1.984719518272824,
    "timesteps": 15728628,
    "learntime": 0.1728608498815447,
    "sampletime": 8.537202962907031,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 66,
    "reward_mean": 1.8672699945939542,
    "reward_max": 2.2606180890607974,
    "reward_min": 1.6340927164005572,
    "reward_std": 0.11186410262587987,
    "timesteps": 16089348,
    "learntime": 0.11969152605161071,
    "sampletime": 8.599834345048293,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 67,
    "reward_mean": -1.1299414572408004,
    "reward_max": 2.2208359594153437,
    "reward_min": -61.78228093980754,
    "reward_std": 8.483548023937297,
    "timesteps": 16441077,
    "learntime": 0.1829174179583788,
    "sampletime": 8.371822418877855,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 68,
    "reward_mean": 1.7361502219121918,
    "reward_max": 2.1349470761417617,
    "reward_min": 1.1805517271312747,
    "reward_std": 0.18207160445440204,
    "timesteps": 16801797,
    "learntime": 0.12319314596243203,
    "sampletime": 8.528967777034268,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 69,
    "reward_mean": 1.7743528771293597,
    "reward_max": 2.073502242852664,
    "reward_min": 1.4803373964589817,
    "reward_std": 0.13882392350899248,
    "timesteps": 17162517,
    "learntime": 0.17494099796749651,
    "sampletime": 8.451502357143909,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 70,
    "reward_mean": 1.8131955782343556,
    "reward_max": 2.178854902402637,
    "reward_min": 1.395625891021951,
    "reward_std": 0.1448243656611982,
    "timesteps": 17523237,
    "learntime": 0.12339163711294532,
    "sampletime": 8.619408296886832,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 71,
    "reward_mean": 1.8028914600126653,
    "reward_max": 2.1804728198829126,
    "reward_min": 1.4966462738247506,
    "reward_std": 0.1527649646819695,
    "timesteps": 17883957,
    "learntime": 0.17727100709453225,
    "sampletime": 8.519222777104005,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 72,
    "reward_mean": 1.7798444314080772,
    "reward_max": 2.2209375139562195,
    "reward_min": 1.2804822554444923,
    "reward_std": 0.16140593879752588,
    "timesteps": 18244677,
    "learntime": 0.10930071608163416,
    "sampletime": 8.571627190103754,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 73,
    "reward_mean": 1.8131424829518221,
    "reward_max": 2.169663594505186,
    "reward_min": 1.4153380829798548,
    "reward_std": 0.16359699247361562,
    "timesteps": 18605397,
    "learntime": 0.16324011702090502,
    "sampletime": 8.525993510847911,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 74,
    "reward_mean": 1.7721635360733752,
    "reward_max": 2.22744338652895,
    "reward_min": 1.3434381998129956,
    "reward_std": 0.15202170306135523,
    "timesteps": 18966117,
    "learntime": 0.11725977389141917,
    "sampletime": 8.658692136174068,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 75,
    "reward_mean": 1.7833131057144005,
    "reward_max": 2.129017093834229,
    "reward_min": 1.4916072738018207,
    "reward_std": 0.1447651098977334,
    "timesteps": 19326837,
    "learntime": 0.18195763300172985,
    "sampletime": 8.524164255941287,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 76,
    "reward_mean": 1.8468159781136944,
    "reward_max": 2.2148500320116793,
    "reward_min": 1.5205648770083096,
    "reward_std": 0.1452164582558042,
    "timesteps": 19687557,
    "learntime": 0.13011276815086603,
    "sampletime": 8.537294728914276,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 77,
    "reward_mean": 1.875189914659899,
    "reward_max": 2.173421370014287,
    "reward_min": 1.5920841820382812,
    "reward_std": 0.13778882876281448,
    "timesteps": 20048277,
    "learntime": 0.18312120996415615,
    "sampletime": 8.661530527984723,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 78,
    "reward_mean": 1.858387611583331,
    "reward_max": 2.243866981488984,
    "reward_min": 1.544122258987924,
    "reward_std": 0.1430213160280324,
    "timesteps": 20408997,
    "learntime": 0.12462396104820073,
    "sampletime": 8.531057198997587,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 79,
    "reward_mean": 1.8084033523809782,
    "reward_max": 2.182752132122967,
    "reward_min": 1.439010003366449,
    "reward_std": 0.136820660385389,
    "timesteps": 20769717,
    "learntime": 0.1709197978489101,
    "sampletime": 8.651979650836438,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 80,
    "reward_mean": 1.8001204213655462,
    "reward_max": 2.133700546013915,
    "reward_min": 1.544654642522798,
    "reward_std": 0.13405386638830866,
    "timesteps": 21130437,
    "learntime": 0.12446194794028997,
    "sampletime": 8.521717669907957,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 81,
    "reward_mean": 1.7228461246781726,
    "reward_max": 2.018473058539622,
    "reward_min": 1.3979099988796226,
    "reward_std": 0.14148584713815315,
    "timesteps": 21491157,
    "learntime": 0.16308499407023191,
    "sampletime": 8.621202594833449,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 82,
    "reward_mean": 1.8058298452057588,
    "reward_max": 2.2431676187967002,
    "reward_min": 1.3525008876499147,
    "reward_std": 0.18146990432110008,
    "timesteps": 21851877,
    "learntime": 0.12156063504517078,
    "sampletime": 8.498194295912981,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 83,
    "reward_mean": 1.3624802576035977,
    "reward_max": 2.109834511918859,
    "reward_min": -7.769504370428906,
    "reward_std": 1.918145262459881,
    "timesteps": 22211367,
    "learntime": 0.18444432388059795,
    "sampletime": 8.701322741806507,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 84,
    "reward_mean": 1.7890955357205502,
    "reward_max": 2.171789818006357,
    "reward_min": 1.2798715458696004,
    "reward_std": 0.15481800086739755,
    "timesteps": 22572087,
    "learntime": 0.11633399198763072,
    "sampletime": 8.542336189886555,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 85,
    "reward_mean": 1.8134314654963024,
    "reward_max": 2.1162871697536776,
    "reward_min": 1.489877415190371,
    "reward_std": 0.1350532049259689,
    "timesteps": 22932807,
    "learntime": 0.17006435804069042,
    "sampletime": 8.448816492920741,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 86,
    "reward_mean": 1.8675373582481507,
    "reward_max": 2.258833254038383,
    "reward_min": 1.4745876679727268,
    "reward_std": 0.1678663225129436,
    "timesteps": 23293527,
    "learntime": 0.11662047985009849,
    "sampletime": 8.578343705041334,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 87,
    "reward_mean": 1.7389489847954094,
    "reward_max": 2.146414571921479,
    "reward_min": 1.4106479467309045,
    "reward_std": 0.15343912034526466,
    "timesteps": 23654247,
    "learntime": 0.15947056096047163,
    "sampletime": 8.591366678010672,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 88,
    "reward_mean": 1.4175039568593473,
    "reward_max": 2.3283660152898817,
    "reward_min": -7.296586049889976,
    "reward_std": 1.902376416847704,
    "timesteps": 24013821,
    "learntime": 0.1193503700196743,
    "sampletime": 8.748246036004275,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 89,
    "reward_mean": 1.798943645347069,
    "reward_max": 2.3486523548474163,
    "reward_min": 1.446018485987388,
    "reward_std": 0.14514749022339635,
    "timesteps": 24374541,
    "learntime": 0.1714224498718977,
    "sampletime": 8.568466129014269,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 90,
    "reward_mean": 1.8339495438901423,
    "reward_max": 2.4054319046201376,
    "reward_min": 1.465655304421845,
    "reward_std": 0.1940664020672639,
    "timesteps": 24735261,
    "learntime": 0.12723142001777887,
    "sampletime": 8.48531078104861,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 91,
    "reward_mean": 1.8387236121078456,
    "reward_max": 2.1885382484320077,
    "reward_min": 1.55346398978468,
    "reward_std": 0.14235106644414702,
    "timesteps": 25095981,
    "learntime": 0.17794163199141622,
    "sampletime": 8.597119064070284,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 92,
    "reward_mean": 1.8665838478869494,
    "reward_max": 2.245465357407792,
    "reward_min": 1.4527137431238444,
    "reward_std": 0.15815032081736524,
    "timesteps": 25456701,
    "learntime": 0.11786225391551852,
    "sampletime": 8.618908952921629,
    "best_max_mean": 1.6057211638531097,
    "best_max": 2.4207475148864543
  },
  {
    "gen": 93,
    "reward_mean": 1.8438424855624782,
    "reward_max": 2.4353959641779146,
    "reward_min": 1.536308085814885,
    "reward_std": 0.1699529930956924,
    "timesteps": 25817421,
    "learntime": 0.1604542271234095,
    "sampletime": 8.617406100034714,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 94,
    "reward_mean": 1.8292762950906805,
    "reward_max": 2.1821598251101944,
    "reward_min": 1.5680882043035844,
    "reward_std": 0.16088479185926388,
    "timesteps": 26178141,
    "learntime": 0.12374753202311695,
    "sampletime": 8.59695308888331,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 95,
    "reward_mean": 1.8605830274404083,
    "reward_max": 2.1532385282334854,
    "reward_min": 1.5206885039870999,
    "reward_std": 0.15175691072009528,
    "timesteps": 26538861,
    "learntime": 0.18823391408659518,
    "sampletime": 8.631118158111349,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 96,
    "reward_mean": 1.3577479990887065,
    "reward_max": 2.076310939946612,
    "reward_min": -7.318889287591009,
    "reward_std": 1.8859397950611951,
    "timesteps": 26898420,
    "learntime": 0.1278820619918406,
    "sampletime": 8.44307671696879,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 97,
    "reward_mean": 1.8201028433018165,
    "reward_max": 2.131878993936078,
    "reward_min": 1.5026805244393218,
    "reward_std": 0.13349971976073355,
    "timesteps": 27259140,
    "learntime": 0.18695478094741702,
    "sampletime": 8.59372456301935,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 98,
    "reward_mean": 1.8549824600003717,
    "reward_max": 2.136833842939018,
    "reward_min": 1.5350975805336142,
    "reward_std": 0.13277104762907085,
    "timesteps": 27619860,
    "learntime": 0.12225809111259878,
    "sampletime": 8.577332088025287,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 99,
    "reward_mean": 1.8135750688300383,
    "reward_max": 2.1920612261270747,
    "reward_min": 1.387476075348921,
    "reward_std": 0.15192984733908238,
    "timesteps": 27980580,
    "learntime": 0.16515815583989024,
    "sampletime": 8.503913890803233,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 100,
    "reward_mean": 1.4044047532073505,
    "reward_max": 2.226917915287862,
    "reward_min": -6.838007699754655,
    "reward_std": 1.8205225706750456,
    "timesteps": 28340232,
    "learntime": 0.12187952199019492,
    "sampletime": 8.478467751061544,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 101,
    "reward_mean": 1.3598318627057286,
    "reward_max": 2.1721114438259956,
    "reward_min": -7.169738280922034,
    "reward_std": 1.7853568664028416,
    "timesteps": 28699707,
    "learntime": 0.16002440778538585,
    "sampletime": 8.567252045031637,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 102,
    "reward_mean": 1.8199854286871333,
    "reward_max": 2.0817132094381305,
    "reward_min": 1.5533917929543242,
    "reward_std": 0.13446122234312757,
    "timesteps": 29060427,
    "learntime": 0.11621881392784417,
    "sampletime": 8.687449957011268,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 103,
    "reward_mean": 1.8055615684179755,
    "reward_max": 2.124750659284301,
    "reward_min": 1.3458421353575274,
    "reward_std": 0.1651659445448548,
    "timesteps": 29421147,
    "learntime": 0.1707536408212036,
    "sampletime": 8.51169870607555,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 104,
    "reward_mean": 1.7910449023467274,
    "reward_max": 2.0258040348408275,
    "reward_min": 1.3622720861916802,
    "reward_std": 0.13859643003273672,
    "timesteps": 29781867,
    "learntime": 0.12426668591797352,
    "sampletime": 8.516797719988972,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 105,
    "reward_mean": 1.800558428484063,
    "reward_max": 2.2136412065337905,
    "reward_min": 1.4448020156689563,
    "reward_std": 0.14925180567402585,
    "timesteps": 30142587,
    "learntime": 0.17554671899415553,
    "sampletime": 8.636691699037328,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 106,
    "reward_mean": 1.7902239106963127,
    "reward_max": 2.089369299380585,
    "reward_min": 1.183703992828887,
    "reward_std": 0.1586830711722602,
    "timesteps": 30503307,
    "learntime": 0.11710999812930822,
    "sampletime": 8.50351895717904,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 107,
    "reward_mean": 1.8295275469751062,
    "reward_max": 2.2703465727068792,
    "reward_min": 1.4687864040930014,
    "reward_std": 0.1460255071046036,
    "timesteps": 30864027,
    "learntime": 0.1776225280482322,
    "sampletime": 8.617527287919074,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 108,
    "reward_mean": 1.8425188061994344,
    "reward_max": 2.1560485464352563,
    "reward_min": 1.441508987227056,
    "reward_std": 0.14126496038746736,
    "timesteps": 31224747,
    "learntime": 0.12139158300124109,
    "sampletime": 8.541982716182247,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 109,
    "reward_mean": 1.805019450860995,
    "reward_max": 2.118811530823057,
    "reward_min": 1.3966747252729155,
    "reward_std": 0.14767219667525436,
    "timesteps": 31585467,
    "learntime": 0.179976352956146,
    "sampletime": 8.617684266995639,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 110,
    "reward_mean": 1.439344981347884,
    "reward_max": 2.2425230345062555,
    "reward_min": -7.218818652190476,
    "reward_std": 1.9155310110256285,
    "timesteps": 31945092,
    "learntime": 0.11681389017030597,
    "sampletime": 8.596420526038855,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 111,
    "reward_mean": 1.8465280063268383,
    "reward_max": 2.2088321682743026,
    "reward_min": 1.627031128186814,
    "reward_std": 0.13305904823492193,
    "timesteps": 32305812,
    "learntime": 0.17088635894469917,
    "sampletime": 8.509094073902816,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 112,
    "reward_mean": 1.8007712616722449,
    "reward_max": 2.131308844649921,
    "reward_min": 1.555153424796915,
    "reward_std": 0.12781357125086548,
    "timesteps": 32666532,
    "learntime": 0.11959966504946351,
    "sampletime": 8.549672375898808,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 113,
    "reward_mean": 1.8217953599032626,
    "reward_max": 2.1347633017170584,
    "reward_min": 1.3304064361833605,
    "reward_std": 0.16004004781244097,
    "timesteps": 33027252,
    "learntime": 0.16715350397862494,
    "sampletime": 8.449086138047278,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 114,
    "reward_mean": 1.4191529474335567,
    "reward_max": 2.1245686415285365,
    "reward_min": -7.080276738248252,
    "reward_std": 1.8652160750183377,
    "timesteps": 33386781,
    "learntime": 0.12336130510084331,
    "sampletime": 8.542289647040889,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 115,
    "reward_mean": 1.880896420046251,
    "reward_max": 2.2150219442233303,
    "reward_min": 1.431862945037814,
    "reward_std": 0.1492262081369713,
    "timesteps": 33747501,
    "learntime": 0.1744839500170201,
    "sampletime": 8.476458815159276,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 116,
    "reward_mean": 1.8164206625797064,
    "reward_max": 2.1748652970868076,
    "reward_min": 1.4140033409921933,
    "reward_std": 0.13546062390331495,
    "timesteps": 34108221,
    "learntime": 0.1275475020520389,
    "sampletime": 8.54848056891933,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 117,
    "reward_mean": 1.0055376375594922,
    "reward_max": 2.1854415414290416,
    "reward_min": -7.076859031777395,
    "reward_std": 2.464273481531437,
    "timesteps": 34467102,
    "learntime": 0.18480642698705196,
    "sampletime": 8.454242649953812,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 118,
    "reward_mean": 1.7717260978351637,
    "reward_max": 2.1777671850709734,
    "reward_min": 1.461604803073866,
    "reward_std": 0.1464708610418815,
    "timesteps": 34827822,
    "learntime": 0.11955668218433857,
    "sampletime": 8.4649139479734,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 119,
    "reward_mean": 1.775906827161965,
    "reward_max": 2.200581100966892,
    "reward_min": 1.5301259081117493,
    "reward_std": 0.15170622928184613,
    "timesteps": 35188542,
    "learntime": 0.1769234319217503,
    "sampletime": 8.597477860050276,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 120,
    "reward_mean": 1.8216991321540297,
    "reward_max": 2.3387817081300315,
    "reward_min": 1.5197425273686846,
    "reward_std": 0.17026673085273114,
    "timesteps": 35549262,
    "learntime": 0.12016564910300076,
    "sampletime": 8.589523673988879,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 121,
    "reward_mean": 1.7389701524698882,
    "reward_max": 2.0300018433005156,
    "reward_min": 1.4098240253652963,
    "reward_std": 0.14078044756113678,
    "timesteps": 35909982,
    "learntime": 0.17493627802468836,
    "sampletime": 8.63060511299409,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 122,
    "reward_mean": 1.8385915053882966,
    "reward_max": 2.285837875607254,
    "reward_min": 1.531838098198121,
    "reward_std": 0.16964652790739046,
    "timesteps": 36270702,
    "learntime": 0.1314127438236028,
    "sampletime": 8.51492344494909,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 123,
    "reward_mean": 1.373490063151034,
    "reward_max": 2.1917737298997824,
    "reward_min": -7.358886542948756,
    "reward_std": 1.9323476965364854,
    "timesteps": 36630216,
    "learntime": 0.1704225749708712,
    "sampletime": 8.687874163966626,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 124,
    "reward_mean": 1.8229135401269443,
    "reward_max": 2.2535321145269025,
    "reward_min": 1.3464659056061794,
    "reward_std": 0.16973182749624838,
    "timesteps": 36990936,
    "learntime": 0.11173146613873541,
    "sampletime": 8.550677887164056,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 125,
    "reward_mean": 1.849392754796286,
    "reward_max": 2.335297485402954,
    "reward_min": 1.5168953725515142,
    "reward_std": 0.15140861241400058,
    "timesteps": 37351656,
    "learntime": 0.16635238705202937,
    "sampletime": 8.525681413942948,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 126,
    "reward_mean": 1.4361281384142193,
    "reward_max": 2.1859497866698225,
    "reward_min": -6.750691706809451,
    "reward_std": 1.7692782915716685,
    "timesteps": 37711152,
    "learntime": 0.12707483186386526,
    "sampletime": 8.46155633800663,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 127,
    "reward_mean": 1.8471961142723474,
    "reward_max": 2.1622984294354493,
    "reward_min": 1.4889736503263855,
    "reward_std": 0.12891509758219263,
    "timesteps": 38071872,
    "learntime": 0.1699905728455633,
    "sampletime": 8.56606133794412,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 128,
    "reward_mean": 1.8447179916833552,
    "reward_max": 2.2063662793952985,
    "reward_min": 1.4751117881987168,
    "reward_std": 0.15259274369240017,
    "timesteps": 38432592,
    "learntime": 0.12245086207985878,
    "sampletime": 8.638600856997073,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 129,
    "reward_mean": 1.7922027347952976,
    "reward_max": 2.0811891052025264,
    "reward_min": 1.5476991579282275,
    "reward_std": 0.13269520448177194,
    "timesteps": 38793312,
    "learntime": 0.18253555102273822,
    "sampletime": 8.522918392904103,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 130,
    "reward_mean": 1.7931518693347512,
    "reward_max": 2.244028211370193,
    "reward_min": 1.4736206729836367,
    "reward_std": 0.1449438352927126,
    "timesteps": 39154032,
    "learntime": 0.11585272196680307,
    "sampletime": 8.67840020218864,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 131,
    "reward_mean": 1.7707630439451578,
    "reward_max": 2.1303212661910527,
    "reward_min": 1.4038748783415105,
    "reward_std": 0.1444169755878066,
    "timesteps": 39514752,
    "learntime": 0.1798954550176859,
    "sampletime": 8.565232953988016,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 132,
    "reward_mean": 1.7862054473340097,
    "reward_max": 2.0794328896921437,
    "reward_min": 1.4718385117647053,
    "reward_std": 0.1433942118020762,
    "timesteps": 39875472,
    "learntime": 0.12226095702499151,
    "sampletime": 8.558012960013002,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 133,
    "reward_mean": 1.396112765336524,
    "reward_max": 2.1078555574993385,
    "reward_min": -7.225593523690341,
    "reward_std": 1.8608446715509206,
    "timesteps": 40235154,
    "learntime": 0.17737600510008633,
    "sampletime": 8.472348453011364,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 134,
    "reward_mean": 1.8419248241991086,
    "reward_max": 2.0382854638155536,
    "reward_min": 1.61050197012567,
    "reward_std": 0.12268399515533061,
    "timesteps": 40595874,
    "learntime": 0.12696117092855275,
    "sampletime": 8.52909278916195,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 135,
    "reward_mean": 1.775701977954959,
    "reward_max": 2.1045957732195437,
    "reward_min": 1.3033063511918008,
    "reward_std": 0.14149689885237235,
    "timesteps": 40956594,
    "learntime": 0.18469901802018285,
    "sampletime": 8.585826792987064,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 136,
    "reward_mean": 1.8048925785729417,
    "reward_max": 2.0657866028050176,
    "reward_min": 1.1496230139869785,
    "reward_std": 0.15766350867180495,
    "timesteps": 41317314,
    "learntime": 0.12920088786631823,
    "sampletime": 8.601081063970923,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 137,
    "reward_mean": 1.7751762933525654,
    "reward_max": 2.0644842351003603,
    "reward_min": 1.4031587210907162,
    "reward_std": 0.1584096341381679,
    "timesteps": 41678034,
    "learntime": 0.17410891805775464,
    "sampletime": 8.463817144045606,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 138,
    "reward_mean": 1.784280032193482,
    "reward_max": 2.295124737761037,
    "reward_min": 1.3954696832289377,
    "reward_std": 0.16871433205752479,
    "timesteps": 42038754,
    "learntime": 0.12765484885312617,
    "sampletime": 8.521642605075613,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 139,
    "reward_mean": 1.7879035264614567,
    "reward_max": 2.0722914818589624,
    "reward_min": 1.4163876529289101,
    "reward_std": 0.14743518210016962,
    "timesteps": 42399474,
    "learntime": 0.17179322196170688,
    "sampletime": 8.688201775075868,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 140,
    "reward_mean": 1.8066980332634235,
    "reward_max": 2.1623375027892022,
    "reward_min": 1.3385461158921081,
    "reward_std": 0.1673493757272423,
    "timesteps": 42760194,
    "learntime": 0.11494525498710573,
    "sampletime": 8.536354829091579,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 141,
    "reward_mean": 1.930593738766068,
    "reward_max": 2.2314051161132107,
    "reward_min": 1.6562074320862628,
    "reward_std": 0.13719826149110653,
    "timesteps": 43120914,
    "learntime": 0.17071748594753444,
    "sampletime": 8.638038425939158,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 142,
    "reward_mean": 1.812280337870279,
    "reward_max": 2.304144229313044,
    "reward_min": 1.3865188243657791,
    "reward_std": 0.15464246442822646,
    "timesteps": 43481634,
    "learntime": 0.12352993106469512,
    "sampletime": 8.590476931072772,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 143,
    "reward_mean": 1.4100071742215299,
    "reward_max": 2.20927278873701,
    "reward_min": -7.266487552406036,
    "reward_std": 1.7850084742638506,
    "timesteps": 43841154,
    "learntime": 0.1840642609167844,
    "sampletime": 8.555872352793813,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 144,
    "reward_mean": 1.813212084056762,
    "reward_max": 2.1963545659220673,
    "reward_min": 1.384708443504869,
    "reward_std": 0.15831254405844783,
    "timesteps": 44201874,
    "learntime": 0.1247467880602926,
    "sampletime": 8.566809304989874,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 145,
    "reward_mean": 1.7447219623649866,
    "reward_max": 2.105597976892371,
    "reward_min": 1.339036614972759,
    "reward_std": 0.16782338226241256,
    "timesteps": 44562594,
    "learntime": 0.16714868205599487,
    "sampletime": 8.544526963029057,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 146,
    "reward_mean": 1.81647539631136,
    "reward_max": 2.1367224395737217,
    "reward_min": 1.4211420690831273,
    "reward_std": 0.14262607660152263,
    "timesteps": 44923314,
    "learntime": 0.12036608112975955,
    "sampletime": 8.504015169804916,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 147,
    "reward_mean": 1.80448620569031,
    "reward_max": 2.2326774464348658,
    "reward_min": 1.4802137719022774,
    "reward_std": 0.15915584937565516,
    "timesteps": 45284034,
    "learntime": 0.19361694296821952,
    "sampletime": 8.500962910009548,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 148,
    "reward_mean": 1.3586959026783076,
    "reward_max": 2.307150808755648,
    "reward_min": -7.217648367592397,
    "reward_std": 1.8870853803963779,
    "timesteps": 45643593,
    "learntime": 0.13140891795046628,
    "sampletime": 8.715070206904784,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 149,
    "reward_mean": 1.7456451385345648,
    "reward_max": 2.2725174848367713,
    "reward_min": 1.2727821347705828,
    "reward_std": 0.1851092113244081,
    "timesteps": 46004313,
    "learntime": 0.18043749686330557,
    "sampletime": 8.582750889007002,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 150,
    "reward_mean": 1.3753365597756373,
    "reward_max": 2.03437508468447,
    "reward_min": -7.332755242797168,
    "reward_std": 1.883358673308476,
    "timesteps": 46363860,
    "learntime": 0.1327419988811016,
    "sampletime": 8.532177264802158,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 151,
    "reward_mean": 1.7184150739438915,
    "reward_max": 2.1862367217812158,
    "reward_min": 1.4404832661650366,
    "reward_std": 0.14673885902980138,
    "timesteps": 46724580,
    "learntime": 0.1794945620931685,
    "sampletime": 8.516058815876022,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 152,
    "reward_mean": 1.4561514125565402,
    "reward_max": 2.311653241684378,
    "reward_min": -7.310572289874089,
    "reward_std": 1.9363148937023542,
    "timesteps": 47084064,
    "learntime": 0.12035759910941124,
    "sampletime": 8.533736798912287,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 153,
    "reward_mean": 1.4706756497595639,
    "reward_max": 2.167780963224104,
    "reward_min": -7.019393686586147,
    "reward_std": 1.822297098086111,
    "timesteps": 47443665,
    "learntime": 0.17151457001455128,
    "sampletime": 8.463870455045253,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 154,
    "reward_mean": 1.768962130666477,
    "reward_max": 2.121673132053037,
    "reward_min": 1.496391346819243,
    "reward_std": 0.14183930780645343,
    "timesteps": 47804385,
    "learntime": 0.12195979012176394,
    "sampletime": 8.495140329003334,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 155,
    "reward_mean": 1.7808284233691296,
    "reward_max": 2.164449692137579,
    "reward_min": 1.3653991033141992,
    "reward_std": 0.14705033230553324,
    "timesteps": 48165105,
    "learntime": 0.1858552440535277,
    "sampletime": 8.56068432983011,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 156,
    "reward_mean": 1.8242908676837444,
    "reward_max": 2.1420392146136473,
    "reward_min": 1.2997861741512813,
    "reward_std": 0.16518073961172833,
    "timesteps": 48525825,
    "learntime": 0.12566597410477698,
    "sampletime": 8.522995411185548,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 157,
    "reward_mean": 1.8089089924937873,
    "reward_max": 2.2216031368192137,
    "reward_min": 1.5020883734299166,
    "reward_std": 0.13876427835718222,
    "timesteps": 48886545,
    "learntime": 0.17206957004964352,
    "sampletime": 8.685893065063283,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 158,
    "reward_mean": 1.8288847985877825,
    "reward_max": 2.2037483959169455,
    "reward_min": 1.3316251814972129,
    "reward_std": 0.18490642851643846,
    "timesteps": 49247265,
    "learntime": 0.11466319998726249,
    "sampletime": 8.539661965100095,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 159,
    "reward_mean": 1.8437067968493102,
    "reward_max": 2.103134929329492,
    "reward_min": 1.52851125384746,
    "reward_std": 0.1361606507260455,
    "timesteps": 49607985,
    "learntime": 0.16302868211641908,
    "sampletime": 8.532249930081889,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 160,
    "reward_mean": 1.82464729228552,
    "reward_max": 2.1831490748039784,
    "reward_min": 1.4245330864919874,
    "reward_std": 0.16987085396339557,
    "timesteps": 49968705,
    "learntime": 0.12308350810781121,
    "sampletime": 8.627692811889574,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 161,
    "reward_mean": 1.3767746615807182,
    "reward_max": 2.1834035331072883,
    "reward_min": -7.119546635884261,
    "reward_std": 1.8737834115931664,
    "timesteps": 50328261,
    "learntime": 0.1637155411299318,
    "sampletime": 8.602898909943178,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 162,
    "reward_mean": 1.7456695787635912,
    "reward_max": 2.091242304214656,
    "reward_min": 1.472778058000482,
    "reward_std": 0.13840703095030849,
    "timesteps": 50688981,
    "learntime": 0.13533892203122377,
    "sampletime": 8.535997366067022,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 163,
    "reward_mean": 1.814272975146143,
    "reward_max": 2.208903115766587,
    "reward_min": 1.4482499478617652,
    "reward_std": 0.14078033135560147,
    "timesteps": 51049701,
    "learntime": 0.16150732897222042,
    "sampletime": 8.550060102948919,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 164,
    "reward_mean": 1.38945321796791,
    "reward_max": 2.2257564013473714,
    "reward_min": -7.233096079982001,
    "reward_std": 1.8473473387762118,
    "timesteps": 51409242,
    "learntime": 0.11382962996140122,
    "sampletime": 8.586119625950232,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 165,
    "reward_mean": 1.4339745075798531,
    "reward_max": 2.1043467300196137,
    "reward_min": -7.3497854483350915,
    "reward_std": 1.8745880831640571,
    "timesteps": 51768696,
    "learntime": 0.1941043371334672,
    "sampletime": 8.500110771972686,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 166,
    "reward_mean": 1.4147149312635303,
    "reward_max": 2.13529224056401,
    "reward_min": -7.281291344054892,
    "reward_std": 1.846101229370237,
    "timesteps": 52128171,
    "learntime": 0.13237448781728745,
    "sampletime": 8.579010931076482,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 167,
    "reward_mean": 1.336050213266669,
    "reward_max": 2.1591368032955347,
    "reward_min": -7.416684472533235,
    "reward_std": 1.9401880237800702,
    "timesteps": 52487646,
    "learntime": 0.17872976791113615,
    "sampletime": 8.465576492017135,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 168,
    "reward_mean": 1.8381485013223635,
    "reward_max": 2.1862140653168085,
    "reward_min": 1.418121518142109,
    "reward_std": 0.15305138050043246,
    "timesteps": 52848366,
    "learntime": 0.1258375879842788,
    "sampletime": 8.512865104014054,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 169,
    "reward_mean": 1.795780583570839,
    "reward_max": 2.0927723826784064,
    "reward_min": 1.4450578463676516,
    "reward_std": 0.15612802049898292,
    "timesteps": 53209086,
    "learntime": 0.18310793489217758,
    "sampletime": 8.599996665958315,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 170,
    "reward_mean": 1.7976071301451144,
    "reward_max": 2.0357036503361665,
    "reward_min": 1.4919193068124095,
    "reward_std": 0.11976982975522477,
    "timesteps": 53569806,
    "learntime": 0.12057686899788678,
    "sampletime": 8.526037578005344,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 171,
    "reward_mean": 1.857412392185919,
    "reward_max": 2.3336088538778803,
    "reward_min": 1.5185861342346663,
    "reward_std": 0.16142326680787802,
    "timesteps": 53930526,
    "learntime": 0.17419116315431893,
    "sampletime": 8.611703005153686,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 172,
    "reward_mean": 1.8017639581272376,
    "reward_max": 2.0640383904489368,
    "reward_min": 1.382925763949361,
    "reward_std": 0.161203521708961,
    "timesteps": 54291246,
    "learntime": 0.12993168085813522,
    "sampletime": 8.485401245998219,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 173,
    "reward_mean": 1.3880431252154017,
    "reward_max": 2.2223448830191024,
    "reward_min": -7.253003590899013,
    "reward_std": 1.8888465290517698,
    "timesteps": 54650832,
    "learntime": 0.1615271980408579,
    "sampletime": 8.516643329057842,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 174,
    "reward_mean": 1.379675254848465,
    "reward_max": 2.230365407472059,
    "reward_min": -7.141001886062001,
    "reward_std": 1.825362870793174,
    "timesteps": 55010418,
    "learntime": 0.12183310813270509,
    "sampletime": 8.658807221101597,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 175,
    "reward_mean": 1.782194417570759,
    "reward_max": 2.085104230710484,
    "reward_min": 1.5368603137515775,
    "reward_std": 0.1214137265419355,
    "timesteps": 55371138,
    "learntime": 0.1797058351803571,
    "sampletime": 8.587088177911937,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 176,
    "reward_mean": 1.840054346538028,
    "reward_max": 2.184071595002683,
    "reward_min": 1.5060031140103183,
    "reward_std": 0.1616008345207717,
    "timesteps": 55731858,
    "learntime": 0.11488743079826236,
    "sampletime": 8.4921563079115,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 177,
    "reward_mean": 1.739214376002944,
    "reward_max": 2.0583406367381483,
    "reward_min": 1.4446914772984596,
    "reward_std": 0.11666887689826844,
    "timesteps": 56092578,
    "learntime": 0.18207426415756345,
    "sampletime": 8.517892543924972,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 178,
    "reward_mean": 0.9940473551046453,
    "reward_max": 2.20066966261815,
    "reward_min": -7.367640744792883,
    "reward_std": 2.646465515041753,
    "timesteps": 56450838,
    "learntime": 0.12235396611504257,
    "sampletime": 8.521205733995885,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 179,
    "reward_mean": 1.7488835818969448,
    "reward_max": 2.162407424777151,
    "reward_min": 1.4123363445021682,
    "reward_std": 0.16565769616457143,
    "timesteps": 56811558,
    "learntime": 0.17852102499455214,
    "sampletime": 8.587602013954893,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 180,
    "reward_mean": 1.941139313588819,
    "reward_max": 2.423711513444273,
    "reward_min": 1.198179451690078,
    "reward_std": 0.2012815913668782,
    "timesteps": 57172278,
    "learntime": 0.13226061407476664,
    "sampletime": 8.48153359699063,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 181,
    "reward_mean": 1.8428971068702653,
    "reward_max": 2.1702572518124432,
    "reward_min": 1.4596220136471914,
    "reward_std": 0.15650157558651673,
    "timesteps": 57532998,
    "learntime": 0.17360827000811696,
    "sampletime": 8.446159322047606,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 182,
    "reward_mean": 1.803825875212515,
    "reward_max": 2.098548610483041,
    "reward_min": 1.465467035304753,
    "reward_std": 0.14116531485492242,
    "timesteps": 57893718,
    "learntime": 0.11962520494125783,
    "sampletime": 8.485351693816483,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 183,
    "reward_mean": 1.8247167029705886,
    "reward_max": 2.373854855255391,
    "reward_min": 1.3964388732653736,
    "reward_std": 0.18931770644398668,
    "timesteps": 58254438,
    "learntime": 0.16860684799030423,
    "sampletime": 8.588153349934146,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 184,
    "reward_mean": 1.7971552199627423,
    "reward_max": 2.092122784527921,
    "reward_min": 1.4574204492550251,
    "reward_std": 0.15515641516046177,
    "timesteps": 58615158,
    "learntime": 0.12534329993650317,
    "sampletime": 8.431680960813537,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 185,
    "reward_mean": 1.7619145150945523,
    "reward_max": 2.1345889256905712,
    "reward_min": 1.432403275961845,
    "reward_std": 0.15189598689091313,
    "timesteps": 58975878,
    "learntime": 0.16645484184846282,
    "sampletime": 8.564397556008771,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 186,
    "reward_mean": 1.7955146902146437,
    "reward_max": 2.2250617234544308,
    "reward_min": 1.327585315852154,
    "reward_std": 0.1779971580685472,
    "timesteps": 59336598,
    "learntime": 0.13218696182593703,
    "sampletime": 8.54085987387225,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 187,
    "reward_mean": 0.9643370940526369,
    "reward_max": 2.1676413180715737,
    "reward_min": -16.23306333382304,
    "reward_std": 3.090500919442468,
    "timesteps": 59694738,
    "learntime": 0.16934689693152905,
    "sampletime": 8.473748804070055,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 188,
    "reward_mean": 1.843970902629449,
    "reward_max": 2.232618503310457,
    "reward_min": 1.2024677752580637,
    "reward_std": 0.14694846383260252,
    "timesteps": 60055458,
    "learntime": 0.12789623718708754,
    "sampletime": 8.55590479890816,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 189,
    "reward_mean": 1.438626316266694,
    "reward_max": 2.1920461307163324,
    "reward_min": -7.05656140849566,
    "reward_std": 1.8787122452594043,
    "timesteps": 60415038,
    "learntime": 0.17537058587186038,
    "sampletime": 8.50613274006173,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 190,
    "reward_mean": 1.8003614040613294,
    "reward_max": 2.1307290005691617,
    "reward_min": 1.4516806826048325,
    "reward_std": 0.1430602450432688,
    "timesteps": 60775758,
    "learntime": 0.12591588404029608,
    "sampletime": 8.525154292816296,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 191,
    "reward_mean": 1.8935786640192105,
    "reward_max": 2.239351525070199,
    "reward_min": 1.4762412850913158,
    "reward_std": 0.15249481814256122,
    "timesteps": 61136478,
    "learntime": 0.16280202195048332,
    "sampletime": 8.497775582130998,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 192,
    "reward_mean": 1.8211057812223947,
    "reward_max": 2.1308118023973086,
    "reward_min": 1.407323477719202,
    "reward_std": 0.15053746497610604,
    "timesteps": 61497198,
    "learntime": 0.12412668112665415,
    "sampletime": 8.77243497595191,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 193,
    "reward_mean": 1.8136385148420868,
    "reward_max": 2.246201240916197,
    "reward_min": 1.4279015812913463,
    "reward_std": 0.15634043053514152,
    "timesteps": 61857918,
    "learntime": 0.1707876401487738,
    "sampletime": 8.559699794044718,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 194,
    "reward_mean": 1.8352354240911017,
    "reward_max": 2.170137421799481,
    "reward_min": 1.5230916516156834,
    "reward_std": 0.13548493492551916,
    "timesteps": 62218638,
    "learntime": 0.12287086015567183,
    "sampletime": 8.54728086409159,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 195,
    "reward_mean": 1.7962941283274119,
    "reward_max": 2.0462366108421848,
    "reward_min": 1.426633709333887,
    "reward_std": 0.14304229733013857,
    "timesteps": 62579358,
    "learntime": 0.1839157440699637,
    "sampletime": 8.543769126059487,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 196,
    "reward_mean": 1.8891849571059613,
    "reward_max": 2.2095627857594398,
    "reward_min": 1.5888619691152879,
    "reward_std": 0.13244648842996848,
    "timesteps": 62940078,
    "learntime": 0.12897380907088518,
    "sampletime": 8.525503888959065,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 197,
    "reward_mean": 1.8008798907012835,
    "reward_max": 2.0791545808694494,
    "reward_min": 1.4432123305812217,
    "reward_std": 0.12341858134894929,
    "timesteps": 63300798,
    "learntime": 0.18052863702178001,
    "sampletime": 8.612105409847572,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 198,
    "reward_mean": 1.8495113891358108,
    "reward_max": 2.142212590861491,
    "reward_min": 1.5779542286148445,
    "reward_std": 0.1293027805688972,
    "timesteps": 63661518,
    "learntime": 0.13147471798583865,
    "sampletime": 8.46550588007085,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 199,
    "reward_mean": 1.729832639503781,
    "reward_max": 2.0070939108898664,
    "reward_min": 1.367628741522571,
    "reward_std": 0.13839381977789564,
    "timesteps": 64022238,
    "learntime": 0.17805308289825916,
    "sampletime": 8.56131983594969,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 200,
    "reward_mean": 1.7936615234266307,
    "reward_max": 2.2368619737248827,
    "reward_min": 1.5117909162589844,
    "reward_std": 0.1463512363509587,
    "timesteps": 64382958,
    "learntime": 0.1239479009527713,
    "sampletime": 8.449791233986616,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 201,
    "reward_mean": 1.7970548136938835,
    "reward_max": 2.088431702472006,
    "reward_min": 1.5223393923220223,
    "reward_std": 0.13182592909762542,
    "timesteps": 64743678,
    "learntime": 0.16778693604283035,
    "sampletime": 8.45619313698262,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 202,
    "reward_mean": 1.8210082057407964,
    "reward_max": 2.1213621693622704,
    "reward_min": 1.286707993124074,
    "reward_std": 0.14834075912649353,
    "timesteps": 65104398,
    "learntime": 0.12854465004056692,
    "sampletime": 8.664192517986521,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 203,
    "reward_mean": 1.8824992755721925,
    "reward_max": 2.190121228214895,
    "reward_min": 1.5322229433157986,
    "reward_std": 0.14834913157334328,
    "timesteps": 65465118,
    "learntime": 0.17621937301009893,
    "sampletime": 8.472562509821728,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 204,
    "reward_mean": 1.5118467176575328,
    "reward_max": 2.312593747607684,
    "reward_min": -15.817833192477174,
    "reward_std": 2.4047607510443876,
    "timesteps": 65824659,
    "learntime": 0.11735494714230299,
    "sampletime": 8.523087266134098,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 205,
    "reward_mean": 1.8219972967676483,
    "reward_max": 2.2115239608890844,
    "reward_min": 1.4123195222152072,
    "reward_std": 0.14463140850492306,
    "timesteps": 66185379,
    "learntime": 0.16607279004529119,
    "sampletime": 8.54185909498483,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 206,
    "reward_mean": 1.8109988726480393,
    "reward_max": 2.117082428081296,
    "reward_min": 1.4749290332953051,
    "reward_std": 0.13176622508884583,
    "timesteps": 66546099,
    "learntime": 0.12747109006159008,
    "sampletime": 8.572771712904796,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 207,
    "reward_mean": 1.7930909653605012,
    "reward_max": 2.0361301999981856,
    "reward_min": 1.424054882376255,
    "reward_std": 0.1495074657238873,
    "timesteps": 66906819,
    "learntime": 0.1841404689475894,
    "sampletime": 8.541452476987615,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 208,
    "reward_mean": 1.7765636957756525,
    "reward_max": 2.263867376665022,
    "reward_min": 1.4222747506520872,
    "reward_std": 0.15876267154559331,
    "timesteps": 67267539,
    "learntime": 0.12920241197571158,
    "sampletime": 8.467285040067509,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 209,
    "reward_mean": 1.800006052862534,
    "reward_max": 2.213274839716781,
    "reward_min": 1.4300650380953965,
    "reward_std": 0.1587018300562845,
    "timesteps": 67628259,
    "learntime": 0.18110575387254357,
    "sampletime": 8.594852017005906,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 210,
    "reward_mean": 1.4442006792800355,
    "reward_max": 2.2166616543139672,
    "reward_min": -6.389626278029435,
    "reward_std": 1.6978692186445579,
    "timesteps": 67987785,
    "learntime": 0.13492027902975678,
    "sampletime": 8.57284750090912,
    "best_max_mean": 1.8438424855624782,
    "best_max": 2.4353959641779146
  },
  {
    "gen": 211,
    "reward_mean": 1.8571361908933444,
    "reward_max": 2.5008536224010025,
    "reward_min": 1.4168670149167246,
    "reward_std": 0.18417548588837432,
    "timesteps": 68348505,
    "learntime": 0.17465296504087746,
    "sampletime": 8.51114888000302,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 212,
    "reward_mean": 1.7742812194164788,
    "reward_max": 2.0662467588783406,
    "reward_min": 1.4039031575622622,
    "reward_std": 0.15180997394648685,
    "timesteps": 68709225,
    "learntime": 0.12410874804481864,
    "sampletime": 8.540415704948828,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 213,
    "reward_mean": 1.7878241848349448,
    "reward_max": 2.1512389482918954,
    "reward_min": 1.4979766208932461,
    "reward_std": 0.13612409920164842,
    "timesteps": 69069945,
    "learntime": 0.1738894700538367,
    "sampletime": 8.51954998797737,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 214,
    "reward_mean": 1.8009985356434177,
    "reward_max": 2.138454180288435,
    "reward_min": 1.4709307801668066,
    "reward_std": 0.1458350430630285,
    "timesteps": 69430665,
    "learntime": 0.12232508487068117,
    "sampletime": 8.542694268980995,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 215,
    "reward_mean": 1.804381515841359,
    "reward_max": 2.105239201434109,
    "reward_min": 1.5170896030013485,
    "reward_std": 0.14172318259416064,
    "timesteps": 69791385,
    "learntime": 0.1679512991104275,
    "sampletime": 8.658445690060034,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 216,
    "reward_mean": 1.7971331299644318,
    "reward_max": 2.1268260571823396,
    "reward_min": 1.4459605244214084,
    "reward_std": 0.15078468860968006,
    "timesteps": 70152105,
    "learntime": 0.12418349809013307,
    "sampletime": 8.69150291197002,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 217,
    "reward_mean": 1.8374961479520833,
    "reward_max": 2.2238097263845797,
    "reward_min": 1.4415362016532292,
    "reward_std": 0.15249705550787637,
    "timesteps": 70512825,
    "learntime": 0.16788075515069067,
    "sampletime": 8.522272040136158,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 218,
    "reward_mean": 1.8301323946077694,
    "reward_max": 2.316788171530899,
    "reward_min": 1.3928435012154876,
    "reward_std": 0.1466548666497507,
    "timesteps": 70873545,
    "learntime": 0.13062542397528887,
    "sampletime": 8.51691354997456,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 219,
    "reward_mean": 1.8425919407412958,
    "reward_max": 2.3037858625290064,
    "reward_min": 1.5015549384115696,
    "reward_std": 0.1715394819132894,
    "timesteps": 71234265,
    "learntime": 0.1588424078654498,
    "sampletime": 8.49535301188007,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 220,
    "reward_mean": 1.8329055517740787,
    "reward_max": 2.2128609895219338,
    "reward_min": 1.507759234924431,
    "reward_std": 0.14912174726101352,
    "timesteps": 71594985,
    "learntime": 0.12455009599216282,
    "sampletime": 8.475464405026287,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 221,
    "reward_mean": 1.811927478874959,
    "reward_max": 2.3212294674718357,
    "reward_min": 1.3863395554274587,
    "reward_std": 0.16421797879918876,
    "timesteps": 71955705,
    "learntime": 0.16665365686640143,
    "sampletime": 8.521113150985911,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 222,
    "reward_mean": 1.77288316021279,
    "reward_max": 2.222392289486542,
    "reward_min": 1.3944918010833596,
    "reward_std": 0.14838376021611627,
    "timesteps": 72316425,
    "learntime": 0.12484028097242117,
    "sampletime": 8.512719501042739,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 223,
    "reward_mean": 1.4404351551425434,
    "reward_max": 2.192269402623145,
    "reward_min": -7.133467654451541,
    "reward_std": 1.9012128052536656,
    "timesteps": 72676047,
    "learntime": 0.18714505806565285,
    "sampletime": 8.639608182944357,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 224,
    "reward_mean": 1.4352509268723224,
    "reward_max": 2.1681692001046446,
    "reward_min": -6.975107722505612,
    "reward_std": 1.8171900516913395,
    "timesteps": 73035927,
    "learntime": 0.12798506091348827,
    "sampletime": 8.63899420411326,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 225,
    "reward_mean": 1.4754693197392992,
    "reward_max": 2.374333402342418,
    "reward_min": -6.522817935490621,
    "reward_std": 1.7601159373110926,
    "timesteps": 73395558,
    "learntime": 0.1779502381104976,
    "sampletime": 8.476911633042619,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 226,
    "reward_mean": 1.830683311083722,
    "reward_max": 2.171123106219577,
    "reward_min": 1.5107280282324849,
    "reward_std": 0.13511821880465802,
    "timesteps": 73756278,
    "learntime": 0.12370419502258301,
    "sampletime": 8.497825975064188,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 227,
    "reward_mean": 1.823913782919739,
    "reward_max": 2.2438724300712516,
    "reward_min": 1.4798992384281553,
    "reward_std": 0.15958756601867305,
    "timesteps": 74116998,
    "learntime": 0.18357693194411695,
    "sampletime": 8.512181590078399,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 228,
    "reward_mean": 1.3242318316595063,
    "reward_max": 2.126766646097441,
    "reward_min": -7.530450365892401,
    "reward_std": 1.950845062690502,
    "timesteps": 74476848,
    "learntime": 0.12654712609946728,
    "sampletime": 8.642634832998738,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 229,
    "reward_mean": 1.788567900310662,
    "reward_max": 2.3639010997770407,
    "reward_min": 1.3110898936151445,
    "reward_std": 0.1748287025625583,
    "timesteps": 74837568,
    "learntime": 0.17892402480356395,
    "sampletime": 8.569070108002052,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 230,
    "reward_mean": 1.7806867836873856,
    "reward_max": 2.288122677919805,
    "reward_min": 1.4271478440231538,
    "reward_std": 0.14549624211679965,
    "timesteps": 75198288,
    "learntime": 0.1228174171410501,
    "sampletime": 8.564304555999115,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 231,
    "reward_mean": 1.7847229850582185,
    "reward_max": 2.0933867803480193,
    "reward_min": 1.4604989152592458,
    "reward_std": 0.151129289247205,
    "timesteps": 75559008,
    "learntime": 0.16603551292791963,
    "sampletime": 8.660404223948717,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 232,
    "reward_mean": 1.7915741839785952,
    "reward_max": 2.2461768525495724,
    "reward_min": 1.386186964499451,
    "reward_std": 0.14952094551493125,
    "timesteps": 75919728,
    "learntime": 0.12449611211195588,
    "sampletime": 8.565269832033664,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 233,
    "reward_mean": 1.8326820413111387,
    "reward_max": 2.1618043127148656,
    "reward_min": 1.474020817937948,
    "reward_std": 0.13436192268400823,
    "timesteps": 76280448,
    "learntime": 0.17170920595526695,
    "sampletime": 8.573937576962635,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 234,
    "reward_mean": 1.808357432132466,
    "reward_max": 2.2418431789256186,
    "reward_min": 1.433409873253282,
    "reward_std": 0.17223961171410007,
    "timesteps": 76641168,
    "learntime": 0.11517993314191699,
    "sampletime": 8.51068010693416,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 235,
    "reward_mean": 1.7571824232012458,
    "reward_max": 2.160232989367971,
    "reward_min": 1.353239358662075,
    "reward_std": 0.1593495641109732,
    "timesteps": 77001888,
    "learntime": 0.1673214379698038,
    "sampletime": 8.549538353923708,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 236,
    "reward_mean": 1.7875701442718968,
    "reward_max": 2.0769699571202636,
    "reward_min": 1.4372981421748199,
    "reward_std": 0.14035327643683868,
    "timesteps": 77362608,
    "learntime": 0.12976327002979815,
    "sampletime": 8.457394904922694,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 237,
    "reward_mean": 1.795078935878461,
    "reward_max": 2.0972457450733386,
    "reward_min": 1.4380526562630531,
    "reward_std": 0.13730051054087494,
    "timesteps": 77723328,
    "learntime": 0.179732735035941,
    "sampletime": 8.539071656996384,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 238,
    "reward_mean": 1.8693440972802393,
    "reward_max": 2.315273136006326,
    "reward_min": 1.622635413696922,
    "reward_std": 0.1307480776834132,
    "timesteps": 78084048,
    "learntime": 0.12118701101280749,
    "sampletime": 8.678669766988605,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 239,
    "reward_mean": 1.8017433175453044,
    "reward_max": 2.295143403473597,
    "reward_min": 1.3826277800884157,
    "reward_std": 0.18704622482634145,
    "timesteps": 78444768,
    "learntime": 0.17499311501160264,
    "sampletime": 8.523890458978713,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 240,
    "reward_mean": 1.8436840268637056,
    "reward_max": 2.1833603916549866,
    "reward_min": 1.4181946678468684,
    "reward_std": 0.16686706346531743,
    "timesteps": 78805488,
    "learntime": 0.12566175987012684,
    "sampletime": 8.498702027834952,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 241,
    "reward_mean": 1.771714759111683,
    "reward_max": 1.983800043321079,
    "reward_min": 1.4564412240861442,
    "reward_std": 0.12629621338297506,
    "timesteps": 79166208,
    "learntime": 0.1749007310718298,
    "sampletime": 8.538293805904686,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 242,
    "reward_mean": 1.858994733838966,
    "reward_max": 2.2362663248698476,
    "reward_min": 1.373707151583703,
    "reward_std": 0.1626443064347829,
    "timesteps": 79526928,
    "learntime": 0.12643218808807433,
    "sampletime": 8.580440855119377,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 243,
    "reward_mean": 1.795040067383468,
    "reward_max": 2.085573627465317,
    "reward_min": 1.2867317700310534,
    "reward_std": 0.16034914971492373,
    "timesteps": 79887648,
    "learntime": 0.1814531448762864,
    "sampletime": 8.450009509921074,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 244,
    "reward_mean": 1.8889420597359354,
    "reward_max": 2.25391548744863,
    "reward_min": 1.5754488510719933,
    "reward_std": 0.16848884471339423,
    "timesteps": 80248368,
    "learntime": 0.12553274701349437,
    "sampletime": 8.552032221108675,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 245,
    "reward_mean": 1.8049524586971177,
    "reward_max": 2.1268959742993676,
    "reward_min": 1.439341181483485,
    "reward_std": 0.14737493293303564,
    "timesteps": 80609088,
    "learntime": 0.17005712701939046,
    "sampletime": 8.540699299890548,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 246,
    "reward_mean": 1.8548513025937297,
    "reward_max": 2.3684361524109097,
    "reward_min": 1.5364342871277237,
    "reward_std": 0.16073015096855145,
    "timesteps": 80969808,
    "learntime": 0.12576656602323055,
    "sampletime": 8.520536614116281,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 247,
    "reward_mean": 1.790945064872996,
    "reward_max": 2.0939921988174306,
    "reward_min": 1.493722614347157,
    "reward_std": 0.147217293814363,
    "timesteps": 81330528,
    "learntime": 0.17682979605160654,
    "sampletime": 8.47143040294759,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 248,
    "reward_mean": 1.76918798397426,
    "reward_max": 2.182189125778454,
    "reward_min": 1.4297864425882088,
    "reward_std": 0.17244055815493245,
    "timesteps": 81691248,
    "learntime": 0.13535324414260685,
    "sampletime": 8.567573645850644,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 249,
    "reward_mean": 1.7757892346356525,
    "reward_max": 2.2254994312110763,
    "reward_min": 1.4306042916423634,
    "reward_std": 0.15896884903232575,
    "timesteps": 82051968,
    "learntime": 0.1659830801654607,
    "sampletime": 8.515321912011132,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 250,
    "reward_mean": 1.3636236002410738,
    "reward_max": 2.0525708882616684,
    "reward_min": -7.121890552912553,
    "reward_std": 1.8573786466707305,
    "timesteps": 82411518,
    "learntime": 0.11763701704330742,
    "sampletime": 8.53164401720278,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 251,
    "reward_mean": 1.764847783898364,
    "reward_max": 2.176120047683877,
    "reward_min": 1.4676811913636285,
    "reward_std": 0.13797940479523071,
    "timesteps": 82772238,
    "learntime": 0.1844027868937701,
    "sampletime": 8.510607521981001,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 252,
    "reward_mean": 1.808566674230489,
    "reward_max": 2.2441556820174946,
    "reward_min": 1.395843884854745,
    "reward_std": 0.16035451936238396,
    "timesteps": 83132958,
    "learntime": 0.1307082730345428,
    "sampletime": 8.659140845062211,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 253,
    "reward_mean": 1.7990504917998011,
    "reward_max": 2.146488002011069,
    "reward_min": 1.490307062567973,
    "reward_std": 0.13474515523236635,
    "timesteps": 83493678,
    "learntime": 0.190902812872082,
    "sampletime": 8.476119032828137,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 254,
    "reward_mean": 1.7832392112415811,
    "reward_max": 2.249575880950665,
    "reward_min": 1.476838157402886,
    "reward_std": 0.15377429484945437,
    "timesteps": 83854398,
    "learntime": 0.13057358097285032,
    "sampletime": 8.574052388779819,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 255,
    "reward_mean": 1.8107249948489357,
    "reward_max": 2.1557598595620298,
    "reward_min": 1.4661660118215472,
    "reward_std": 0.14063681824662472,
    "timesteps": 84215118,
    "learntime": 0.1822392710018903,
    "sampletime": 8.593726543942466,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 256,
    "reward_mean": 1.7535851893119032,
    "reward_max": 2.253267184245594,
    "reward_min": 1.4549244300561048,
    "reward_std": 0.15406554373074544,
    "timesteps": 84575838,
    "learntime": 0.1224207878112793,
    "sampletime": 8.488255101954564,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 257,
    "reward_mean": 1.772796079529246,
    "reward_max": 2.058597084371175,
    "reward_min": 1.4117709306477917,
    "reward_std": 0.13881458136298128,
    "timesteps": 84936558,
    "learntime": 0.17103974195197225,
    "sampletime": 8.517607999965549,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 258,
    "reward_mean": 1.8609553792834626,
    "reward_max": 2.303732894325741,
    "reward_min": 1.5600697874841762,
    "reward_std": 0.15151987657639435,
    "timesteps": 85297278,
    "learntime": 0.12773094791918993,
    "sampletime": 8.500037317862734,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 259,
    "reward_mean": 1.8339252404980968,
    "reward_max": 2.2661710937408652,
    "reward_min": 1.3723343453144248,
    "reward_std": 0.14469995980707845,
    "timesteps": 85657998,
    "learntime": 0.1706884209997952,
    "sampletime": 8.670716524124146,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 260,
    "reward_mean": 1.793164525474498,
    "reward_max": 2.1486918194870186,
    "reward_min": 1.3281637091598797,
    "reward_std": 0.16810548416356758,
    "timesteps": 86018718,
    "learntime": 0.12887348281219602,
    "sampletime": 8.503021238837391,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 261,
    "reward_mean": 1.7806970054074338,
    "reward_max": 2.1105469005450472,
    "reward_min": 1.5051703065647843,
    "reward_std": 0.1399526304891225,
    "timesteps": 86379438,
    "learntime": 0.17664059717208147,
    "sampletime": 8.526201124070212,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 262,
    "reward_mean": 1.8549171949294303,
    "reward_max": 2.2972583723550803,
    "reward_min": 1.5285086320205152,
    "reward_std": 0.15811388257011846,
    "timesteps": 86740158,
    "learntime": 0.12291654804721475,
    "sampletime": 8.52881329599768,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 263,
    "reward_mean": 1.8775675719260558,
    "reward_max": 2.3710778740227583,
    "reward_min": 1.585561034505986,
    "reward_std": 0.16034818967226916,
    "timesteps": 87100878,
    "learntime": 0.17495710193179548,
    "sampletime": 8.479036165867,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 264,
    "reward_mean": 1.8197571454192505,
    "reward_max": 2.336344099892866,
    "reward_min": 1.5036185854974458,
    "reward_std": 0.15730341914998358,
    "timesteps": 87461598,
    "learntime": 0.12815208896063268,
    "sampletime": 8.491233451059088,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 265,
    "reward_mean": 0.9103517976407914,
    "reward_max": 2.09442400062493,
    "reward_min": -7.836862491768307,
    "reward_std": 2.583619083172783,
    "timesteps": 87820038,
    "learntime": 0.17521764198318124,
    "sampletime": 8.373346416978166,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 266,
    "reward_mean": 1.8026218315693865,
    "reward_max": 2.1802470174245348,
    "reward_min": 1.3316910786794092,
    "reward_std": 0.1811288919977156,
    "timesteps": 88180758,
    "learntime": 0.1321260470431298,
    "sampletime": 8.586510627996176,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 267,
    "reward_mean": 1.3974828281256018,
    "reward_max": 2.061259273519017,
    "reward_min": -7.673006397517219,
    "reward_std": 1.9972130768286238,
    "timesteps": 88540425,
    "learntime": 0.18783689010888338,
    "sampletime": 8.479435133980587,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 268,
    "reward_mean": 1.8235095112417767,
    "reward_max": 2.203539260126874,
    "reward_min": 1.4108119816792704,
    "reward_std": 0.1582901524035664,
    "timesteps": 88901145,
    "learntime": 0.1274207029491663,
    "sampletime": 8.603968041948974,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 269,
    "reward_mean": 1.7604906583214315,
    "reward_max": 2.1717418551790715,
    "reward_min": 1.363958090261965,
    "reward_std": 0.1501624726478809,
    "timesteps": 89261865,
    "learntime": 0.1699216968845576,
    "sampletime": 8.456594612915069,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 270,
    "reward_mean": 1.7557197075467967,
    "reward_max": 2.268645917085283,
    "reward_min": 1.3896972421948262,
    "reward_std": 0.16663040920461225,
    "timesteps": 89622585,
    "learntime": 0.12815946992486715,
    "sampletime": 8.53347748098895,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 271,
    "reward_mean": 1.7312582391085471,
    "reward_max": 2.108561460581381,
    "reward_min": 1.2484867052601951,
    "reward_std": 0.15970336567420992,
    "timesteps": 89983305,
    "learntime": 0.16804282693192363,
    "sampletime": 8.639524803962559,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 272,
    "reward_mean": 1.4333913266342702,
    "reward_max": 2.208498814065628,
    "reward_min": -7.338473837693915,
    "reward_std": 1.8820796784388374,
    "timesteps": 90342906,
    "learntime": 0.1268542690668255,
    "sampletime": 8.57563646696508,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 273,
    "reward_mean": 1.7888719766541454,
    "reward_max": 2.3407960325128028,
    "reward_min": 1.35689864644175,
    "reward_std": 0.15329163266947335,
    "timesteps": 90703626,
    "learntime": 0.17465496202930808,
    "sampletime": 8.60349843208678,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 274,
    "reward_mean": 1.825769956238235,
    "reward_max": 2.137097630004227,
    "reward_min": 1.407984763990633,
    "reward_std": 0.15202495557902748,
    "timesteps": 91064346,
    "learntime": 0.13146736682392657,
    "sampletime": 8.493706394219771,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 275,
    "reward_mean": 1.90924868673543,
    "reward_max": 2.2621497645564914,
    "reward_min": 1.5255306838644713,
    "reward_std": 0.13544148503547235,
    "timesteps": 91425066,
    "learntime": 0.16652062512002885,
    "sampletime": 8.661197398090735,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 276,
    "reward_mean": 1.731193872484324,
    "reward_max": 2.125008021700934,
    "reward_min": 1.4593476864974917,
    "reward_std": 0.13392944393474468,
    "timesteps": 91785786,
    "learntime": 0.12374376994557679,
    "sampletime": 8.631802316056564,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 277,
    "reward_mean": 1.7164231891902695,
    "reward_max": 2.039251628715479,
    "reward_min": 1.385380567663972,
    "reward_std": 0.14089005858883707,
    "timesteps": 92146506,
    "learntime": 0.16829925798811018,
    "sampletime": 8.504111198941246,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 278,
    "reward_mean": 1.8488602199546411,
    "reward_max": 2.201267297450224,
    "reward_min": 1.5034855240272422,
    "reward_std": 0.16065414463881372,
    "timesteps": 92507226,
    "learntime": 0.13628524006344378,
    "sampletime": 8.589001465123147,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 279,
    "reward_mean": 1.7837742049520746,
    "reward_max": 2.0615356023269893,
    "reward_min": 1.5063225072773265,
    "reward_std": 0.13794696017235442,
    "timesteps": 92867946,
    "learntime": 0.1761736769694835,
    "sampletime": 8.638546510133892,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 280,
    "reward_mean": 1.849439811953253,
    "reward_max": 2.240117024778471,
    "reward_min": 1.4644301908133008,
    "reward_std": 0.15725818202054717,
    "timesteps": 93228666,
    "learntime": 0.12048121890984476,
    "sampletime": 8.555476143024862,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 281,
    "reward_mean": 1.843861340656517,
    "reward_max": 2.1594567540080507,
    "reward_min": 1.492212367824485,
    "reward_std": 0.13192109505905975,
    "timesteps": 93589386,
    "learntime": 0.18098684400320053,
    "sampletime": 8.54651542706415,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 282,
    "reward_mean": 1.3442343871453364,
    "reward_max": 2.204878960249266,
    "reward_min": -8.03333967149427,
    "reward_std": 2.0771126591178266,
    "timesteps": 93948990,
    "learntime": 0.12428358499892056,
    "sampletime": 8.527824013028294,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 283,
    "reward_mean": 1.7477486010519812,
    "reward_max": 2.1346971991087114,
    "reward_min": 1.281812228608141,
    "reward_std": 0.17336497845050616,
    "timesteps": 94309710,
    "learntime": 0.16494297911413014,
    "sampletime": 8.528371827909723,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 284,
    "reward_mean": 1.7677404827364267,
    "reward_max": 2.167810184068608,
    "reward_min": 1.3480153671028345,
    "reward_std": 0.16308506475099732,
    "timesteps": 94670430,
    "learntime": 0.1248868778347969,
    "sampletime": 8.588634306099266,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 285,
    "reward_mean": 1.3658859901166627,
    "reward_max": 2.0589425296356114,
    "reward_min": -7.182654366503951,
    "reward_std": 1.872060574480305,
    "timesteps": 95030130,
    "learntime": 0.17949233297258615,
    "sampletime": 8.553318188991398,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 286,
    "reward_mean": 1.8683929468326195,
    "reward_max": 2.2437384412931127,
    "reward_min": 1.447718868686048,
    "reward_std": 0.1577977124614683,
    "timesteps": 95390850,
    "learntime": 0.1281370169017464,
    "sampletime": 8.479200147092342,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 287,
    "reward_mean": 1.8088714069938734,
    "reward_max": 2.1191133283763017,
    "reward_min": 1.3868915564140059,
    "reward_std": 0.14933570162467213,
    "timesteps": 95751570,
    "learntime": 0.16645242716185749,
    "sampletime": 8.523949653143063,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 288,
    "reward_mean": 1.791077780195291,
    "reward_max": 2.1262456777516143,
    "reward_min": 1.4547958808252575,
    "reward_std": 0.131556917135316,
    "timesteps": 96112290,
    "learntime": 0.12151472107507288,
    "sampletime": 8.618733894079924,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 289,
    "reward_mean": 1.7847033749713859,
    "reward_max": 2.2734466878887725,
    "reward_min": 1.381951862958497,
    "reward_std": 0.16635187374989785,
    "timesteps": 96473010,
    "learntime": 0.16582446498796344,
    "sampletime": 8.583482936955988,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 290,
    "reward_mean": 1.3561029756300291,
    "reward_max": 2.374852677288631,
    "reward_min": -7.606885436689484,
    "reward_std": 1.9298526999335939,
    "timesteps": 96832503,
    "learntime": 0.11751703708432615,
    "sampletime": 8.43753057392314,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 291,
    "reward_mean": 1.3962530085861309,
    "reward_max": 2.090792578935648,
    "reward_min": -7.237433234462517,
    "reward_std": 1.8957063557630864,
    "timesteps": 97192029,
    "learntime": 0.1792952709365636,
    "sampletime": 8.603292847052217,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 292,
    "reward_mean": 1.8050121910313957,
    "reward_max": 2.2215836568044085,
    "reward_min": 1.354331657773757,
    "reward_std": 0.14889291505651256,
    "timesteps": 97552749,
    "learntime": 0.13019653712399304,
    "sampletime": 8.527013694169,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 293,
    "reward_mean": 1.7924337326823596,
    "reward_max": 2.1580716141104443,
    "reward_min": 1.4368741094058881,
    "reward_std": 0.14701399975379767,
    "timesteps": 97913469,
    "learntime": 0.18257154012098908,
    "sampletime": 8.605643803952262,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 294,
    "reward_mean": 1.8106103797850461,
    "reward_max": 2.232371363982867,
    "reward_min": 1.452422617487944,
    "reward_std": 0.1628216076617334,
    "timesteps": 98274189,
    "learntime": 0.13051587692461908,
    "sampletime": 8.46877209795639,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 295,
    "reward_mean": 1.822919917498628,
    "reward_max": 2.341755945962203,
    "reward_min": 1.5635051079281943,
    "reward_std": 0.1481446356300657,
    "timesteps": 98634909,
    "learntime": 0.17319434601813555,
    "sampletime": 8.461463987827301,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 296,
    "reward_mean": 1.8226905374899642,
    "reward_max": 2.164881212041814,
    "reward_min": 1.443218582380336,
    "reward_std": 0.14240926366818188,
    "timesteps": 98995629,
    "learntime": 0.12243608199059963,
    "sampletime": 8.597500497009605,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 297,
    "reward_mean": 1.341035582362101,
    "reward_max": 2.1032548110057205,
    "reward_min": -7.467996717923546,
    "reward_std": 1.8639055521985004,
    "timesteps": 99355083,
    "learntime": 0.17569679813459516,
    "sampletime": 8.61255441303365,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 298,
    "reward_mean": 1.378849074827383,
    "reward_max": 2.0895831735913144,
    "reward_min": -7.312044562080479,
    "reward_std": 1.8970566499159665,
    "timesteps": 99714663,
    "learntime": 0.11761086294427514,
    "sampletime": 8.466201458824798,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 299,
    "reward_mean": 1.7899827547990976,
    "reward_max": 2.044117443305256,
    "reward_min": 1.4858935056601876,
    "reward_std": 0.12632493380970655,
    "timesteps": 100075383,
    "learntime": 0.18014739314094186,
    "sampletime": 8.527424073079601,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 300,
    "reward_mean": 1.463518628627,
    "reward_max": 2.2460904575718517,
    "reward_min": -6.2320886252483545,
    "reward_std": 1.6638805136554744,
    "timesteps": 100434879,
    "learntime": 0.12369499704800546,
    "sampletime": 8.651155104162171,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 301,
    "reward_mean": 1.3818788452514454,
    "reward_max": 2.2374983945011255,
    "reward_min": -7.413532295193752,
    "reward_std": 1.8611511500309144,
    "timesteps": 100794597,
    "learntime": 0.1617152108810842,
    "sampletime": 8.550365529954433,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 302,
    "reward_mean": 0.5752814372600734,
    "reward_max": 2.178473666076156,
    "reward_min": -16.143620492867548,
    "reward_std": 3.4761241246900334,
    "timesteps": 101151768,
    "learntime": 0.13241406506858766,
    "sampletime": 8.616748573025689,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 303,
    "reward_mean": 1.3708030222959544,
    "reward_max": 2.153588949364182,
    "reward_min": -15.979263749867448,
    "reward_std": 2.464599775024891,
    "timesteps": 101511312,
    "learntime": 0.16705287201330066,
    "sampletime": 8.476718102116138,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 304,
    "reward_mean": 1.8126939788975958,
    "reward_max": 2.1432414176824435,
    "reward_min": 1.4376446398638274,
    "reward_std": 0.157910311468934,
    "timesteps": 101872032,
    "learntime": 0.1260449739638716,
    "sampletime": 8.492053617024794,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 305,
    "reward_mean": 1.8000285941331764,
    "reward_max": 2.082937351891206,
    "reward_min": 1.4618161378153152,
    "reward_std": 0.135598463447623,
    "timesteps": 102232752,
    "learntime": 0.18594055902212858,
    "sampletime": 8.540470825973898,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 306,
    "reward_mean": 1.793591977893295,
    "reward_max": 2.0952150896644297,
    "reward_min": 1.4293329153054661,
    "reward_std": 0.14007220630518658,
    "timesteps": 102593472,
    "learntime": 0.1255239259917289,
    "sampletime": 8.531476157950237,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 307,
    "reward_mean": 1.8486883286853337,
    "reward_max": 2.1516319590575406,
    "reward_min": 1.4173883330676627,
    "reward_std": 0.1457456095336566,
    "timesteps": 102954192,
    "learntime": 0.16767677501775324,
    "sampletime": 8.589976406889036,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 308,
    "reward_mean": 1.8214861327150742,
    "reward_max": 2.1544534385741283,
    "reward_min": 1.5084527878524616,
    "reward_std": 0.1353457550448442,
    "timesteps": 103314912,
    "learntime": 0.12779777916148305,
    "sampletime": 8.461184927960858,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 309,
    "reward_mean": 1.4579583643626997,
    "reward_max": 2.322651483466162,
    "reward_min": -6.4525966052606245,
    "reward_std": 1.7435164119865654,
    "timesteps": 103674531,
    "learntime": 0.16540413303300738,
    "sampletime": 8.46801994019188,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 310,
    "reward_mean": 1.8732687962466321,
    "reward_max": 2.2067097369722544,
    "reward_min": 1.587939740345587,
    "reward_std": 0.13855750751462118,
    "timesteps": 104035251,
    "learntime": 0.12420550687238574,
    "sampletime": 8.626293148146942,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 311,
    "reward_mean": 1.8036621875417351,
    "reward_max": 2.1872390364627448,
    "reward_min": 1.506919445110145,
    "reward_std": 0.11545293302394215,
    "timesteps": 104395971,
    "learntime": 0.18327581183984876,
    "sampletime": 8.511134549975395,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 312,
    "reward_mean": 1.8488645363134524,
    "reward_max": 2.1912449375411462,
    "reward_min": 1.5413742499683076,
    "reward_std": 0.13818337984430507,
    "timesteps": 104756691,
    "learntime": 0.1221742790658027,
    "sampletime": 8.5093224409502,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 313,
    "reward_mean": 1.7810927403939225,
    "reward_max": 2.0921345719576054,
    "reward_min": 1.294925840246968,
    "reward_std": 0.14801931323376513,
    "timesteps": 105117411,
    "learntime": 0.17750611598603427,
    "sampletime": 8.558438825886697,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 314,
    "reward_mean": 1.8050792599999903,
    "reward_max": 2.3381135191293905,
    "reward_min": 1.3603333525275525,
    "reward_std": 0.19138180302257832,
    "timesteps": 105478131,
    "learntime": 0.1245604339055717,
    "sampletime": 8.643992559053004,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 315,
    "reward_mean": 1.3719256124440335,
    "reward_max": 2.174738001016629,
    "reward_min": -6.726783259582149,
    "reward_std": 1.7530785854929052,
    "timesteps": 105837798,
    "learntime": 0.16846703994087875,
    "sampletime": 8.604405564023182,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 316,
    "reward_mean": 1.843603078988881,
    "reward_max": 2.280674756692529,
    "reward_min": 1.4972577681861956,
    "reward_std": 0.16055048565821833,
    "timesteps": 106198518,
    "learntime": 0.1315606909338385,
    "sampletime": 8.46263574482873,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 317,
    "reward_mean": 1.8322164490970505,
    "reward_max": 2.238796521683757,
    "reward_min": 1.4572395806381877,
    "reward_std": 0.14527311953318947,
    "timesteps": 106559238,
    "learntime": 0.17547902697697282,
    "sampletime": 8.57731047901325,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 318,
    "reward_mean": 1.8600414957328382,
    "reward_max": 2.1981052176984504,
    "reward_min": 1.606038658121232,
    "reward_std": 0.12987204545870087,
    "timesteps": 106919958,
    "learntime": 0.1291097430512309,
    "sampletime": 8.503195585915819,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 319,
    "reward_mean": 1.8267169650274342,
    "reward_max": 2.158081208937799,
    "reward_min": 1.5747599185684265,
    "reward_std": 0.12746999288871863,
    "timesteps": 107280678,
    "learntime": 0.1878241270314902,
    "sampletime": 8.600829121889547,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 320,
    "reward_mean": 1.8983809861091725,
    "reward_max": 2.2197879007408923,
    "reward_min": 1.462178990685829,
    "reward_std": 0.1637601735702608,
    "timesteps": 107641398,
    "learntime": 0.1255135831888765,
    "sampletime": 8.495446488028392,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 321,
    "reward_mean": 1.4260418118916467,
    "reward_max": 2.2193983739107863,
    "reward_min": -7.100374048100398,
    "reward_std": 1.8108589098392405,
    "timesteps": 108001116,
    "learntime": 0.17333567002788186,
    "sampletime": 8.561907707015052,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 322,
    "reward_mean": 1.8463943739267679,
    "reward_max": 2.2155673719667384,
    "reward_min": 1.4843307045891607,
    "reward_std": 0.15965186172899506,
    "timesteps": 108361836,
    "learntime": 0.12221472477540374,
    "sampletime": 8.591192250838503,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 323,
    "reward_mean": 1.795688675794087,
    "reward_max": 2.1218115299813096,
    "reward_min": 1.5775461825735042,
    "reward_std": 0.11835660008688606,
    "timesteps": 108722556,
    "learntime": 0.18574527115561068,
    "sampletime": 8.50685383589007,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 324,
    "reward_mean": 1.800788596482719,
    "reward_max": 2.1942804796342497,
    "reward_min": 1.3710564106709833,
    "reward_std": 0.18199573803965846,
    "timesteps": 109083276,
    "learntime": 0.12248206604272127,
    "sampletime": 8.670395615976304,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 325,
    "reward_mean": 1.797354482148562,
    "reward_max": 2.27733017726051,
    "reward_min": 1.312105224300493,
    "reward_std": 0.19050501564828176,
    "timesteps": 109443996,
    "learntime": 0.16328499093651772,
    "sampletime": 8.500114803900942,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 326,
    "reward_mean": 1.8475037647423336,
    "reward_max": 2.209733785906184,
    "reward_min": 1.3557130900338605,
    "reward_std": 0.17321128377743533,
    "timesteps": 109804716,
    "learntime": 0.14186120708473027,
    "sampletime": 8.556706007104367,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 327,
    "reward_mean": 1.7500540690715085,
    "reward_max": 2.1853030877492974,
    "reward_min": 1.2928066765183948,
    "reward_std": 0.17968296852884447,
    "timesteps": 110165436,
    "learntime": 0.18404694902710617,
    "sampletime": 8.47236504801549,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 328,
    "reward_mean": 1.8323166682071519,
    "reward_max": 2.245910514462592,
    "reward_min": 1.4332946862348073,
    "reward_std": 0.16722675650345217,
    "timesteps": 110526156,
    "learntime": 0.12990070017986,
    "sampletime": 8.659187979996204,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 329,
    "reward_mean": 1.7373811356165536,
    "reward_max": 2.102427733342415,
    "reward_min": 1.4200266892183895,
    "reward_std": 0.14547141901878807,
    "timesteps": 110886876,
    "learntime": 0.18925561802461743,
    "sampletime": 8.49909091903828,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 330,
    "reward_mean": 1.7533232499316114,
    "reward_max": 2.0962451136521927,
    "reward_min": 1.4927599390044397,
    "reward_std": 0.14173803525090836,
    "timesteps": 111247596,
    "learntime": 0.1303484111558646,
    "sampletime": 8.579809034010395,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 331,
    "reward_mean": 1.7523895778628853,
    "reward_max": 2.09711208981025,
    "reward_min": 1.437181190178361,
    "reward_std": 0.13022283028032394,
    "timesteps": 111608316,
    "learntime": 0.1752242469228804,
    "sampletime": 8.501484232954681,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 332,
    "reward_mean": 1.770883108495221,
    "reward_max": 2.1007038939095533,
    "reward_min": 1.3935900437927808,
    "reward_std": 0.15574446498819575,
    "timesteps": 111969036,
    "learntime": 0.12805281509645283,
    "sampletime": 8.572387372842059,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 333,
    "reward_mean": 1.8607091829350773,
    "reward_max": 2.2292422371789447,
    "reward_min": 1.5284252799765154,
    "reward_std": 0.15209170473283654,
    "timesteps": 112329756,
    "learntime": 0.17689236300066113,
    "sampletime": 8.653118539834395,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 334,
    "reward_mean": 1.7537708650976758,
    "reward_max": 2.058560087844714,
    "reward_min": 1.4077729717122756,
    "reward_std": 0.14648559432705777,
    "timesteps": 112690476,
    "learntime": 0.11963162990286946,
    "sampletime": 8.485603698994964,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 335,
    "reward_mean": 1.8318694626853138,
    "reward_max": 2.307371112513268,
    "reward_min": 1.4105009759994993,
    "reward_std": 0.15342234302026558,
    "timesteps": 113051196,
    "learntime": 0.1774629659485072,
    "sampletime": 8.590892150998116,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 336,
    "reward_mean": 1.854763269979414,
    "reward_max": 2.1162501339551634,
    "reward_min": 1.598085132841432,
    "reward_std": 0.14397448857159437,
    "timesteps": 113411916,
    "learntime": 0.12213884084485471,
    "sampletime": 8.490649810992181,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 337,
    "reward_mean": 1.7922362146621589,
    "reward_max": 2.150258961482021,
    "reward_min": 1.4207245169531983,
    "reward_std": 0.1496830144005522,
    "timesteps": 113772636,
    "learntime": 0.198357222834602,
    "sampletime": 8.560339926974848,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 338,
    "reward_mean": 1.8056101239452063,
    "reward_max": 2.127704831409957,
    "reward_min": 1.3894881427316252,
    "reward_std": 0.15397840927947154,
    "timesteps": 114133356,
    "learntime": 0.1333978520706296,
    "sampletime": 8.473069443833083,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 339,
    "reward_mean": 1.7702522225794013,
    "reward_max": 2.152960714425495,
    "reward_min": 1.4268982262235055,
    "reward_std": 0.15713949098682145,
    "timesteps": 114494076,
    "learntime": 0.1817350829951465,
    "sampletime": 8.428408639039844,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 340,
    "reward_mean": 1.7588272073490003,
    "reward_max": 2.1151864439651185,
    "reward_min": 1.3753553296829142,
    "reward_std": 0.14592591482162154,
    "timesteps": 114854796,
    "learntime": 0.12964650988578796,
    "sampletime": 8.673967478098348,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 341,
    "reward_mean": 1.787435832078983,
    "reward_max": 2.1512203665774745,
    "reward_min": 1.3725550407314455,
    "reward_std": 0.17087255872550738,
    "timesteps": 115215516,
    "learntime": 0.17437345813959837,
    "sampletime": 8.545234068995342,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 342,
    "reward_mean": 1.7863294691984415,
    "reward_max": 2.0776615133650123,
    "reward_min": 1.5006365265728803,
    "reward_std": 0.1342194500090659,
    "timesteps": 115576236,
    "learntime": 0.13611169205978513,
    "sampletime": 8.461953273974359,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 343,
    "reward_mean": 1.8446266121791561,
    "reward_max": 2.3803342954876494,
    "reward_min": 1.5073505530211442,
    "reward_std": 0.15863706058835958,
    "timesteps": 115936956,
    "learntime": 0.17521873698569834,
    "sampletime": 8.480641593923792,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 344,
    "reward_mean": 1.845942617927944,
    "reward_max": 2.076528194048228,
    "reward_min": 1.5934687075536582,
    "reward_std": 0.1176942421187831,
    "timesteps": 116297676,
    "learntime": 0.12780814594589174,
    "sampletime": 8.594777832971886,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 345,
    "reward_mean": 1.8010891640750692,
    "reward_max": 2.239594246652104,
    "reward_min": 1.1846181470777282,
    "reward_std": 0.17639475132855179,
    "timesteps": 116658396,
    "learntime": 0.18168461904861033,
    "sampletime": 8.547032541129738,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 346,
    "reward_mean": 1.7994379023824718,
    "reward_max": 2.3028487518659477,
    "reward_min": 1.3539841144439464,
    "reward_std": 0.17769246336491587,
    "timesteps": 117019116,
    "learntime": 0.12169515690766275,
    "sampletime": 8.398455049842596,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 347,
    "reward_mean": 0.9758915791161084,
    "reward_max": 2.2879799003917864,
    "reward_min": -7.190777793454334,
    "reward_std": 2.5221658402354996,
    "timesteps": 117377604,
    "learntime": 0.18106532585807145,
    "sampletime": 8.515359311830252,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 348,
    "reward_mean": 1.0082910078214604,
    "reward_max": 2.1780389871241286,
    "reward_min": -7.210386497932524,
    "reward_std": 2.525537119383957,
    "timesteps": 117736092,
    "learntime": 0.13207162683829665,
    "sampletime": 8.518421784974635,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 349,
    "reward_mean": 1.8939671335735886,
    "reward_max": 2.226074272764586,
    "reward_min": 1.506234285243406,
    "reward_std": 0.14988503470090597,
    "timesteps": 118096812,
    "learntime": 0.18669855198822916,
    "sampletime": 8.530283275060356,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 350,
    "reward_mean": 1.8131094992689858,
    "reward_max": 2.1204958227471864,
    "reward_min": 1.5394050332474594,
    "reward_std": 0.1326861716141567,
    "timesteps": 118457532,
    "learntime": 0.12973840301856399,
    "sampletime": 8.525343360845,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 351,
    "reward_mean": 1.8199353330605734,
    "reward_max": 2.2054760273198473,
    "reward_min": 1.2895869749417084,
    "reward_std": 0.16005151612933893,
    "timesteps": 118818252,
    "learntime": 0.18626474495977163,
    "sampletime": 8.46724326792173,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 352,
    "reward_mean": 1.8225398830972686,
    "reward_max": 2.2668144215955786,
    "reward_min": 1.4478681662938342,
    "reward_std": 0.1782585155339628,
    "timesteps": 119178972,
    "learntime": 0.1433713249862194,
    "sampletime": 8.570173356914893,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 353,
    "reward_mean": 1.863780293675303,
    "reward_max": 2.182031833868343,
    "reward_min": 1.515169928041743,
    "reward_std": 0.1459660467922118,
    "timesteps": 119539692,
    "learntime": 0.17498547793366015,
    "sampletime": 8.58980185398832,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 354,
    "reward_mean": 1.460768859129559,
    "reward_max": 2.1297781497494026,
    "reward_min": -6.546874425508029,
    "reward_std": 1.6864715845776075,
    "timesteps": 119899278,
    "learntime": 0.11903322511352599,
    "sampletime": 8.608830051030964,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 355,
    "reward_mean": 1.7991446735898393,
    "reward_max": 2.111402534369984,
    "reward_min": 1.4753808298523305,
    "reward_std": 0.14342469847254036,
    "timesteps": 120259998,
    "learntime": 0.18226339691318572,
    "sampletime": 8.528611392015591,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 356,
    "reward_mean": 1.432562890034724,
    "reward_max": 2.2375709292563504,
    "reward_min": -7.537838671354681,
    "reward_std": 1.9092691708486018,
    "timesteps": 120619506,
    "learntime": 0.1267384949605912,
    "sampletime": 8.54254155117087,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 357,
    "reward_mean": 1.8472182636344505,
    "reward_max": 2.262120691382069,
    "reward_min": 1.5521279392209664,
    "reward_std": 0.13985969272946008,
    "timesteps": 120980226,
    "learntime": 0.17894982802681625,
    "sampletime": 8.569166004192084,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 358,
    "reward_mean": 1.867671946731662,
    "reward_max": 2.223668204358543,
    "reward_min": 1.3987041251349352,
    "reward_std": 0.17047680058192485,
    "timesteps": 121340946,
    "learntime": 0.12094378494657576,
    "sampletime": 8.478069020900875,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 359,
    "reward_mean": 1.8117796885648594,
    "reward_max": 2.118051007529365,
    "reward_min": 1.2011799764480753,
    "reward_std": 0.1733212618056113,
    "timesteps": 121701666,
    "learntime": 0.17980830208398402,
    "sampletime": 8.525643238099292,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 360,
    "reward_mean": 1.7813225466398137,
    "reward_max": 2.1868273950125428,
    "reward_min": 1.426183216968305,
    "reward_std": 0.16710150414436234,
    "timesteps": 122062386,
    "learntime": 0.13183807907626033,
    "sampletime": 8.545534870121628,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 361,
    "reward_mean": 1.7205680264687462,
    "reward_max": 2.1148633135140456,
    "reward_min": 1.4087178571194665,
    "reward_std": 0.15979229134771383,
    "timesteps": 122423106,
    "learntime": 0.180559674045071,
    "sampletime": 8.58450535708107,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 362,
    "reward_mean": 1.761568760787488,
    "reward_max": 2.1228962123015194,
    "reward_min": 1.3881150805844076,
    "reward_std": 0.1603170013524562,
    "timesteps": 122783826,
    "learntime": 0.12447741604410112,
    "sampletime": 8.57165361312218,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 363,
    "reward_mean": 1.783982885959608,
    "reward_max": 2.0944738857287994,
    "reward_min": 1.3724929772204497,
    "reward_std": 0.1562841856656657,
    "timesteps": 123144546,
    "learntime": 0.1651003558654338,
    "sampletime": 8.521797712892294,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 364,
    "reward_mean": 1.8721943919443067,
    "reward_max": 2.2811363571778513,
    "reward_min": 1.4519668630616946,
    "reward_std": 0.17513372726480536,
    "timesteps": 123505266,
    "learntime": 0.12496210122480989,
    "sampletime": 8.499948307871819,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 365,
    "reward_mean": 1.9124739778739186,
    "reward_max": 2.2841357820893076,
    "reward_min": 1.5633805451533647,
    "reward_std": 0.16709931861394847,
    "timesteps": 123865986,
    "learntime": 0.18628804199397564,
    "sampletime": 8.499193494906649,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 366,
    "reward_mean": 1.904764937075857,
    "reward_max": 2.275378459669423,
    "reward_min": 1.5606271436183954,
    "reward_std": 0.14239305024362128,
    "timesteps": 124226706,
    "learntime": 0.13268189900554717,
    "sampletime": 8.592206994071603,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 367,
    "reward_mean": 1.831955293553313,
    "reward_max": 2.1669428271142674,
    "reward_min": 1.4605173592572067,
    "reward_std": 0.14707388115919484,
    "timesteps": 124587426,
    "learntime": 0.17767327395267785,
    "sampletime": 8.46389117394574,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 368,
    "reward_mean": 1.8014616605431928,
    "reward_max": 2.0834145568369418,
    "reward_min": 1.340206241248363,
    "reward_std": 0.18813422881823885,
    "timesteps": 124948146,
    "learntime": 0.1292180900927633,
    "sampletime": 8.554520924109966,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 369,
    "reward_mean": 1.829015993936765,
    "reward_max": 2.253279673223115,
    "reward_min": 1.4725564139485898,
    "reward_std": 0.15340245633667887,
    "timesteps": 125308866,
    "learntime": 0.1735682408325374,
    "sampletime": 8.685168663971126,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 370,
    "reward_mean": 1.742466448300399,
    "reward_max": 2.07425310456363,
    "reward_min": 1.4263945200170056,
    "reward_std": 0.1430987405083343,
    "timesteps": 125669586,
    "learntime": 0.12740169698372483,
    "sampletime": 8.503266895189881,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 371,
    "reward_mean": 1.8202112120888785,
    "reward_max": 2.0464983086285105,
    "reward_min": 1.444580119171982,
    "reward_std": 0.1263455716431111,
    "timesteps": 126030306,
    "learntime": 0.1630370318889618,
    "sampletime": 8.625149013008922,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 372,
    "reward_mean": 1.8804955406514279,
    "reward_max": 2.2265063483624306,
    "reward_min": 1.5432777354197391,
    "reward_std": 0.15170481476218314,
    "timesteps": 126391026,
    "learntime": 0.13198222708888352,
    "sampletime": 8.593322776956484,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 373,
    "reward_mean": 1.4520497615019785,
    "reward_max": 2.2249731711086063,
    "reward_min": -7.2321037196406115,
    "reward_std": 1.8595277893336635,
    "timesteps": 126750567,
    "learntime": 0.18481444800272584,
    "sampletime": 8.4678433930967,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 374,
    "reward_mean": 1.4134622863643789,
    "reward_max": 2.1795177422040553,
    "reward_min": -7.072545703610754,
    "reward_std": 1.8613872238868778,
    "timesteps": 127110108,
    "learntime": 0.12435090611688793,
    "sampletime": 8.468909848015755,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 375,
    "reward_mean": 1.7894630552604984,
    "reward_max": 2.096775256378651,
    "reward_min": 1.5303550423087637,
    "reward_std": 0.12659766861218472,
    "timesteps": 127470828,
    "learntime": 0.17544835689477623,
    "sampletime": 8.55824408098124,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 376,
    "reward_mean": 1.817339320426794,
    "reward_max": 2.0527990025236944,
    "reward_min": 1.30294517086374,
    "reward_std": 0.12500516332149467,
    "timesteps": 127831548,
    "learntime": 0.12497089290991426,
    "sampletime": 8.641761617036536,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 377,
    "reward_mean": 1.7928659255222397,
    "reward_max": 2.210155609391625,
    "reward_min": 1.3882844933541478,
    "reward_std": 0.18680362796681366,
    "timesteps": 128192268,
    "learntime": 0.18840976408682764,
    "sampletime": 8.479685937054455,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 378,
    "reward_mean": 1.8087402929922687,
    "reward_max": 2.160157926408119,
    "reward_min": 1.3766564018301177,
    "reward_std": 0.17268661018820083,
    "timesteps": 128552988,
    "learntime": 0.13035893812775612,
    "sampletime": 8.54350200900808,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 379,
    "reward_mean": 1.795310737386691,
    "reward_max": 2.099672156851735,
    "reward_min": 1.5318363909221542,
    "reward_std": 0.15842459565753222,
    "timesteps": 128913708,
    "learntime": 0.1785328248515725,
    "sampletime": 8.543966800905764,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 380,
    "reward_mean": 0.5760921186143915,
    "reward_max": 2.1420115424658723,
    "reward_min": -25.697340588438127,
    "reward_std": 4.225061956167033,
    "timesteps": 129270444,
    "learntime": 0.13223232701420784,
    "sampletime": 8.493926579132676,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 381,
    "reward_mean": 1.8272133505775314,
    "reward_max": 2.2972915157936784,
    "reward_min": 1.380658861524847,
    "reward_std": 0.1730384839463788,
    "timesteps": 129631164,
    "learntime": 0.1932175310794264,
    "sampletime": 8.58361333119683,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 382,
    "reward_mean": 1.8253174892548065,
    "reward_max": 2.0672414078241332,
    "reward_min": 1.5041636893266408,
    "reward_std": 0.12373428281354633,
    "timesteps": 129991884,
    "learntime": 0.1259637491311878,
    "sampletime": 8.517621379112825,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 383,
    "reward_mean": 1.8884204629897576,
    "reward_max": 2.222984033181228,
    "reward_min": 1.4577945663575027,
    "reward_std": 0.137688730964997,
    "timesteps": 130352604,
    "learntime": 0.1762558571062982,
    "sampletime": 8.643312874017283,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 384,
    "reward_mean": 1.8155887089866896,
    "reward_max": 2.1913204751062096,
    "reward_min": 1.5264147372448233,
    "reward_std": 0.15862097485944757,
    "timesteps": 130713324,
    "learntime": 0.1286018481478095,
    "sampletime": 8.628403363982216,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 385,
    "reward_mean": 1.8505899527986531,
    "reward_max": 2.219964982801517,
    "reward_min": 1.4914445318085405,
    "reward_std": 0.1911063222550624,
    "timesteps": 131074044,
    "learntime": 0.18008634680882096,
    "sampletime": 8.552620522910729,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 386,
    "reward_mean": 1.817745023420657,
    "reward_max": 2.1148028880900984,
    "reward_min": 1.475697896414202,
    "reward_std": 0.1310578231686999,
    "timesteps": 131434764,
    "learntime": 0.1334692439995706,
    "sampletime": 8.403160884976387,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 387,
    "reward_mean": 1.2901866579310322,
    "reward_max": 2.154823141408885,
    "reward_min": -7.444319704222974,
    "reward_std": 1.9287234339804007,
    "timesteps": 131794185,
    "learntime": 0.16862688190303743,
    "sampletime": 8.500467891106382,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 388,
    "reward_mean": 0.9901346376613488,
    "reward_max": 2.0777367466062304,
    "reward_min": -7.162245667765311,
    "reward_std": 2.461296937610108,
    "timesteps": 132152688,
    "learntime": 0.1345267230644822,
    "sampletime": 8.493375418940559,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 389,
    "reward_mean": 1.399726633094629,
    "reward_max": 2.085050548098284,
    "reward_min": -7.139335543044251,
    "reward_std": 1.7873507339174768,
    "timesteps": 132512577,
    "learntime": 0.18456056504510343,
    "sampletime": 8.504838376073167,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 390,
    "reward_mean": 1.4628843062091712,
    "reward_max": 2.1624927689060276,
    "reward_min": -7.006533101464978,
    "reward_std": 1.8147184098334201,
    "timesteps": 132872223,
    "learntime": 0.12352787493728101,
    "sampletime": 8.650138759985566,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 391,
    "reward_mean": 1.8563259891122976,
    "reward_max": 2.135068274631822,
    "reward_min": 1.514265266546066,
    "reward_std": 0.14298476651460157,
    "timesteps": 133232943,
    "learntime": 0.18630768987350166,
    "sampletime": 8.512608801014721,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 392,
    "reward_mean": 1.818810460320234,
    "reward_max": 2.168199707200982,
    "reward_min": 1.5612037155290357,
    "reward_std": 0.12354702452157944,
    "timesteps": 133593663,
    "learntime": 0.12385222292505205,
    "sampletime": 8.518069026991725,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 393,
    "reward_mean": 1.351150891914859,
    "reward_max": 2.151312666030004,
    "reward_min": -7.397369703623667,
    "reward_std": 1.9144639269333181,
    "timesteps": 133953120,
    "learntime": 0.19475967390462756,
    "sampletime": 8.568343676859513,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 394,
    "reward_mean": 1.7278981408484224,
    "reward_max": 2.03454694187332,
    "reward_min": 1.4072600381182485,
    "reward_std": 0.13417219054593701,
    "timesteps": 134313840,
    "learntime": 0.12998190382495522,
    "sampletime": 8.464711847016588,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 395,
    "reward_mean": 1.7342733781894748,
    "reward_max": 2.2179270292752173,
    "reward_min": 1.4150617972481974,
    "reward_std": 0.15941715881739452,
    "timesteps": 134674560,
    "learntime": 0.17864649486728013,
    "sampletime": 8.608126697130501,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 396,
    "reward_mean": 1.799284575655439,
    "reward_max": 2.186313486379124,
    "reward_min": 1.418666644208835,
    "reward_std": 0.1901726597715692,
    "timesteps": 135035280,
    "learntime": 0.1245845309458673,
    "sampletime": 8.521324541885406,
    "best_max_mean": 1.8571361908933444,
    "best_max": 2.5008536224010025
  },
  {
    "gen": 397,
    "reward_mean": 1.845385926277884,
    "reward_max": 2.503494267680003,
    "reward_min": 1.5216491007659971,
    "reward_std": 0.16106948761639972,
    "timesteps": 135396000,
    "learntime": 0.1670812419615686,
    "sampletime": 8.583076352020726,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 398,
    "reward_mean": 1.8359221654546027,
    "reward_max": 2.2811667253245633,
    "reward_min": 1.5117641687393162,
    "reward_std": 0.141979090381927,
    "timesteps": 135756720,
    "learntime": 0.14121039398014545,
    "sampletime": 8.48894289904274,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 399,
    "reward_mean": 1.8976004309510865,
    "reward_max": 2.227894799916407,
    "reward_min": 1.4170453275843136,
    "reward_std": 0.180009940578518,
    "timesteps": 136117440,
    "learntime": 0.16745344083756208,
    "sampletime": 8.462235191138461,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 400,
    "reward_mean": 0.6039479049689145,
    "reward_max": 2.1846577663187996,
    "reward_min": -7.220863086488947,
    "reward_std": 3.0333668341023103,
    "timesteps": 136474590,
    "learntime": 0.1269686131272465,
    "sampletime": 8.534734217915684,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 401,
    "reward_mean": 1.4569492069520438,
    "reward_max": 2.3655026571003765,
    "reward_min": -7.226999125141006,
    "reward_std": 1.8661270756052515,
    "timesteps": 136834125,
    "learntime": 0.16817461792379618,
    "sampletime": 8.470361087005585,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 402,
    "reward_mean": 1.8112371043199043,
    "reward_max": 2.186609824935931,
    "reward_min": 1.4814069851418001,
    "reward_std": 0.14386399072444966,
    "timesteps": 137194845,
    "learntime": 0.1261682480107993,
    "sampletime": 8.567375641083345,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 403,
    "reward_mean": 1.7851193831647492,
    "reward_max": 2.146158099834183,
    "reward_min": 1.1871136552786479,
    "reward_std": 0.19180213681814148,
    "timesteps": 137555565,
    "learntime": 0.1802755689714104,
    "sampletime": 8.510693233227357,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 404,
    "reward_mean": 1.8296954496689328,
    "reward_max": 2.1863517035504376,
    "reward_min": 1.4520093103346865,
    "reward_std": 0.16436927775758645,
    "timesteps": 137916285,
    "learntime": 0.12676354893483222,
    "sampletime": 8.62384215905331,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 405,
    "reward_mean": 1.833768386744198,
    "reward_max": 2.202308571523503,
    "reward_min": 1.4974904477412816,
    "reward_std": 0.14116386638053943,
    "timesteps": 138277005,
    "learntime": 0.1903114791493863,
    "sampletime": 8.472961602034047,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 406,
    "reward_mean": 1.769923799992175,
    "reward_max": 2.131799937312987,
    "reward_min": 1.3857527296188161,
    "reward_std": 0.15804170316221208,
    "timesteps": 138637725,
    "learntime": 0.12363557098433375,
    "sampletime": 8.433175116078928,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 407,
    "reward_mean": 1.7808277319661578,
    "reward_max": 2.2032930035017064,
    "reward_min": 1.4415817195831808,
    "reward_std": 0.1604843948974403,
    "timesteps": 138998445,
    "learntime": 0.19080180884338915,
    "sampletime": 8.663652257993817,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 408,
    "reward_mean": 1.8061779978569912,
    "reward_max": 2.0319503160902603,
    "reward_min": 1.4552500954243528,
    "reward_std": 0.1274217298485902,
    "timesteps": 139359165,
    "learntime": 0.13164333789609373,
    "sampletime": 8.627759668044746,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 409,
    "reward_mean": 1.8443220101768767,
    "reward_max": 2.321797462963411,
    "reward_min": 1.3026377744514082,
    "reward_std": 0.17958246670992045,
    "timesteps": 139719885,
    "learntime": 0.176028398796916,
    "sampletime": 8.525704882806167,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 410,
    "reward_mean": 1.7783507824086322,
    "reward_max": 2.162396350246676,
    "reward_min": 1.342738101717479,
    "reward_std": 0.16298572763622962,
    "timesteps": 140080605,
    "learntime": 0.12779966602101922,
    "sampletime": 8.506773359142244,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 411,
    "reward_mean": 1.844786610551032,
    "reward_max": 2.11925219884054,
    "reward_min": 1.3281840081044414,
    "reward_std": 0.17130233362883704,
    "timesteps": 140441325,
    "learntime": 0.16946718795225024,
    "sampletime": 8.549408721039072,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 412,
    "reward_mean": 1.3605384720551414,
    "reward_max": 2.113259537766376,
    "reward_min": -7.194423373619269,
    "reward_std": 1.882793236630979,
    "timesteps": 140801082,
    "learntime": 0.1232127861585468,
    "sampletime": 8.519208398181945,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 413,
    "reward_mean": 1.8186628495104993,
    "reward_max": 2.16432591166019,
    "reward_min": 1.4945902705173137,
    "reward_std": 0.16519169235544146,
    "timesteps": 141161802,
    "learntime": 0.18783285305835307,
    "sampletime": 8.475641045020893,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 414,
    "reward_mean": 1.7893433971832424,
    "reward_max": 2.0005592852698566,
    "reward_min": 1.4232279841759867,
    "reward_std": 0.1349772813308206,
    "timesteps": 141522522,
    "learntime": 0.12713905493728817,
    "sampletime": 8.648480392061174,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 415,
    "reward_mean": 1.8794174970422044,
    "reward_max": 2.240897806999837,
    "reward_min": 1.405550670192687,
    "reward_std": 0.1712357581903108,
    "timesteps": 141883242,
    "learntime": 0.1785014271736145,
    "sampletime": 8.598309580003843,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 416,
    "reward_mean": 1.829463751811387,
    "reward_max": 2.110420332196303,
    "reward_min": 1.6249072480325877,
    "reward_std": 0.11198767591508955,
    "timesteps": 142243962,
    "learntime": 0.12810824601911008,
    "sampletime": 8.530046445084736,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 417,
    "reward_mean": 1.7962556701749188,
    "reward_max": 2.172931763672647,
    "reward_min": 1.434155738025294,
    "reward_std": 0.13010916091813327,
    "timesteps": 142604682,
    "learntime": 0.1749519279692322,
    "sampletime": 8.55685534607619,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 418,
    "reward_mean": 1.7410151737650987,
    "reward_max": 2.1214882158198036,
    "reward_min": 1.4253891136278511,
    "reward_std": 0.15080946882227947,
    "timesteps": 142965402,
    "learntime": 0.13405061489902437,
    "sampletime": 8.603776731994003,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 419,
    "reward_mean": 1.782528821442911,
    "reward_max": 2.021089863391047,
    "reward_min": 1.4612007014396946,
    "reward_std": 0.13146907775160047,
    "timesteps": 143326122,
    "learntime": 0.16807492496445775,
    "sampletime": 8.55270817107521,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 420,
    "reward_mean": 1.8277187444348626,
    "reward_max": 2.147830317918716,
    "reward_min": 1.508613766502642,
    "reward_std": 0.1506560240321213,
    "timesteps": 143686842,
    "learntime": 0.1317178700119257,
    "sampletime": 8.622430467046797,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 421,
    "reward_mean": 1.755006543429956,
    "reward_max": 2.1236291232203106,
    "reward_min": 1.4419820679027109,
    "reward_std": 0.1483857005991002,
    "timesteps": 144047562,
    "learntime": 0.18316406989470124,
    "sampletime": 8.6268055269029,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 422,
    "reward_mean": 1.8624645588332025,
    "reward_max": 2.222539048382631,
    "reward_min": 1.533981579017231,
    "reward_std": 0.15110213003847117,
    "timesteps": 144408282,
    "learntime": 0.1287109509576112,
    "sampletime": 8.510171309811994,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 423,
    "reward_mean": 1.847177751256784,
    "reward_max": 2.2157677466395467,
    "reward_min": 1.522253973721736,
    "reward_std": 0.15513008288181387,
    "timesteps": 144769002,
    "learntime": 0.19149928400292993,
    "sampletime": 8.472508332924917,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 424,
    "reward_mean": 1.7762755110146613,
    "reward_max": 2.2386156987243613,
    "reward_min": 1.2049577680264691,
    "reward_std": 0.18978704898351223,
    "timesteps": 145129722,
    "learntime": 0.1327743751462549,
    "sampletime": 8.589093073038384,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 425,
    "reward_mean": 1.8555408224517724,
    "reward_max": 2.181295016777259,
    "reward_min": 1.4694875556775076,
    "reward_std": 0.16808803189254456,
    "timesteps": 145490442,
    "learntime": 0.17436722107231617,
    "sampletime": 8.547931205946952,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 426,
    "reward_mean": 1.8521250227000987,
    "reward_max": 2.1571240183777367,
    "reward_min": 1.5131672935165192,
    "reward_std": 0.14645033056229811,
    "timesteps": 145851162,
    "learntime": 0.12305514398030937,
    "sampletime": 8.51617004815489,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 427,
    "reward_mean": 1.866130123109964,
    "reward_max": 2.302741811233288,
    "reward_min": 1.5535513500993432,
    "reward_std": 0.15725985092867498,
    "timesteps": 146211882,
    "learntime": 0.1740696718916297,
    "sampletime": 8.603557150112465,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 428,
    "reward_mean": 1.7971112041038593,
    "reward_max": 2.142255315498471,
    "reward_min": 1.4403002434733507,
    "reward_std": 0.1549753277790252,
    "timesteps": 146572602,
    "learntime": 0.13358537992462516,
    "sampletime": 8.532451831968501,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 429,
    "reward_mean": 1.8497783876690206,
    "reward_max": 2.226837525800375,
    "reward_min": 1.5750543901101766,
    "reward_std": 0.16390517884492545,
    "timesteps": 146933322,
    "learntime": 0.18429381703026593,
    "sampletime": 8.679693444166332,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 430,
    "reward_mean": 1.872093041626593,
    "reward_max": 2.317426286483442,
    "reward_min": 1.5571822957682515,
    "reward_std": 0.15281290330728933,
    "timesteps": 147294042,
    "learntime": 0.12128980387933552,
    "sampletime": 8.599446639884263,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 431,
    "reward_mean": 1.8289397245132808,
    "reward_max": 2.205286923078042,
    "reward_min": 1.5010370251468623,
    "reward_std": 0.16051899628308264,
    "timesteps": 147654762,
    "learntime": 0.17680540308356285,
    "sampletime": 8.527538041118532,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 432,
    "reward_mean": 1.8711866384404585,
    "reward_max": 2.2510371413566923,
    "reward_min": 1.4369284561072333,
    "reward_std": 0.1732600866093032,
    "timesteps": 148015482,
    "learntime": 0.12125297589227557,
    "sampletime": 8.594873568974435,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 433,
    "reward_mean": 1.7867094775281818,
    "reward_max": 2.1785092632120926,
    "reward_min": 1.476760571427416,
    "reward_std": 0.14683615777311934,
    "timesteps": 148376202,
    "learntime": 0.18290801206603646,
    "sampletime": 8.564413843909279,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 434,
    "reward_mean": 1.8261964776135855,
    "reward_max": 2.3477151255744193,
    "reward_min": 1.5279115713624778,
    "reward_std": 0.1589688097384529,
    "timesteps": 148736922,
    "learntime": 0.13918159902095795,
    "sampletime": 8.497521684970707,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 435,
    "reward_mean": 1.7653748198524202,
    "reward_max": 2.165909728630341,
    "reward_min": 1.3950616341352335,
    "reward_std": 0.15410109357423996,
    "timesteps": 149097642,
    "learntime": 0.16114269918762147,
    "sampletime": 8.552986086113378,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 436,
    "reward_mean": 1.7881861486271549,
    "reward_max": 2.2509345725411523,
    "reward_min": 1.2331937866878078,
    "reward_std": 0.1956785056236981,
    "timesteps": 149458362,
    "learntime": 0.12913757213391364,
    "sampletime": 8.666641100076959,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 437,
    "reward_mean": 1.8113454364828763,
    "reward_max": 2.174659888695004,
    "reward_min": 1.2666922276539732,
    "reward_std": 0.170456147351529,
    "timesteps": 149819082,
    "learntime": 0.16122013400308788,
    "sampletime": 8.51807134388946,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 438,
    "reward_mean": 1.4131405091184137,
    "reward_max": 2.0814164894364864,
    "reward_min": -7.285266829319441,
    "reward_std": 1.870810368185366,
    "timesteps": 150178593,
    "learntime": 0.13332255906425416,
    "sampletime": 8.590572309913114,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 439,
    "reward_mean": 1.8929549441947116,
    "reward_max": 2.2626836302968267,
    "reward_min": 1.6027226767247242,
    "reward_std": 0.1399468920275531,
    "timesteps": 150539313,
    "learntime": 0.1804357161745429,
    "sampletime": 8.552994567202404,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 440,
    "reward_mean": 1.9020006724201481,
    "reward_max": 2.3753767007799578,
    "reward_min": 1.3194026875681812,
    "reward_std": 0.19048425488368328,
    "timesteps": 150900033,
    "learntime": 0.13380771107040346,
    "sampletime": 8.649623606121168,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 441,
    "reward_mean": 1.4849950008037602,
    "reward_max": 2.2187254432808685,
    "reward_min": -7.280568367891567,
    "reward_std": 1.9244100142020857,
    "timesteps": 151259604,
    "learntime": 0.16950558498501778,
    "sampletime": 8.54437233810313,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 442,
    "reward_mean": 1.8501454952949046,
    "reward_max": 2.2556150463466147,
    "reward_min": 1.3105344706952242,
    "reward_std": 0.17749088998049148,
    "timesteps": 151620324,
    "learntime": 0.1292219830211252,
    "sampletime": 8.575553399976343,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 443,
    "reward_mean": 1.864146881946933,
    "reward_max": 2.082124603503013,
    "reward_min": 1.447587755662176,
    "reward_std": 0.14072331848952688,
    "timesteps": 151981044,
    "learntime": 0.176541289081797,
    "sampletime": 8.64326200983487,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 444,
    "reward_mean": 1.8423409959054475,
    "reward_max": 2.212582454985361,
    "reward_min": 1.386766776170007,
    "reward_std": 0.16530683631441592,
    "timesteps": 152341764,
    "learntime": 0.13097944599576294,
    "sampletime": 8.489703026833013,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 445,
    "reward_mean": 1.790307146459083,
    "reward_max": 2.076829809029619,
    "reward_min": 1.3682772789810143,
    "reward_std": 0.1644801626298901,
    "timesteps": 152702484,
    "learntime": 0.1747001688927412,
    "sampletime": 8.583926343824714,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 446,
    "reward_mean": 1.781567138599293,
    "reward_max": 2.114509806947103,
    "reward_min": 1.308658814361972,
    "reward_std": 0.16320672973994313,
    "timesteps": 153063204,
    "learntime": 0.1275620840024203,
    "sampletime": 8.535908892052248,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 447,
    "reward_mean": 1.810226477178977,
    "reward_max": 2.178045743829427,
    "reward_min": 1.3721027796577348,
    "reward_std": 0.16083716801489392,
    "timesteps": 153423924,
    "learntime": 0.17247136100195348,
    "sampletime": 8.571892631938681,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 448,
    "reward_mean": 1.022491491262127,
    "reward_max": 2.166695783421648,
    "reward_min": -7.033135375325485,
    "reward_std": 2.535706360021324,
    "timesteps": 153782982,
    "learntime": 0.1300514219328761,
    "sampletime": 8.558075270848349,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 449,
    "reward_mean": 1.910742350295823,
    "reward_max": 2.212636674995968,
    "reward_min": 1.530971326489328,
    "reward_std": 0.1591152284843806,
    "timesteps": 154143702,
    "learntime": 0.1638264451175928,
    "sampletime": 8.608559049200267,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 450,
    "reward_mean": 1.8662084873973113,
    "reward_max": 2.2434981084661536,
    "reward_min": 1.574975491051601,
    "reward_std": 0.15669697689675485,
    "timesteps": 154504422,
    "learntime": 0.13207795098423958,
    "sampletime": 8.693869447801262,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 451,
    "reward_mean": 1.8329230728041779,
    "reward_max": 2.088168111225856,
    "reward_min": 1.381697573632027,
    "reward_std": 0.15107439383509186,
    "timesteps": 154865142,
    "learntime": 0.1769215038511902,
    "sampletime": 8.57313217385672,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 452,
    "reward_mean": 1.7852983360329882,
    "reward_max": 2.201495363964399,
    "reward_min": 1.4630836253539472,
    "reward_std": 0.13261291797244348,
    "timesteps": 155225862,
    "learntime": 0.13497912185266614,
    "sampletime": 8.491910330019891,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 453,
    "reward_mean": 1.9176999853449979,
    "reward_max": 2.3329601526387327,
    "reward_min": 1.500720221595129,
    "reward_std": 0.1560944087253897,
    "timesteps": 155586582,
    "learntime": 0.1752303170505911,
    "sampletime": 8.548996265977621,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 454,
    "reward_mean": 1.806913260779437,
    "reward_max": 2.2671307257595306,
    "reward_min": 1.4146398764516361,
    "reward_std": 0.15842235636089386,
    "timesteps": 155947302,
    "learntime": 0.12065141601487994,
    "sampletime": 8.565264896024019,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 455,
    "reward_mean": 1.4592896592256541,
    "reward_max": 2.0969431459706134,
    "reward_min": -6.507071532978446,
    "reward_std": 1.7079880427328924,
    "timesteps": 156306945,
    "learntime": 0.18764963513240218,
    "sampletime": 8.627227123826742,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 456,
    "reward_mean": 1.476124101622628,
    "reward_max": 2.387127041809654,
    "reward_min": -7.269642911305493,
    "reward_std": 1.852821147718437,
    "timesteps": 156666588,
    "learntime": 0.12303225183859468,
    "sampletime": 8.503162506967783,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 457,
    "reward_mean": 1.8431520182958512,
    "reward_max": 2.2010795193491477,
    "reward_min": 1.574708013329652,
    "reward_std": 0.12788731112614368,
    "timesteps": 157027308,
    "learntime": 0.17874629492871463,
    "sampletime": 8.626975069055334,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 458,
    "reward_mean": 1.749632339448731,
    "reward_max": 2.1635510990921745,
    "reward_min": 1.4244045558708316,
    "reward_std": 0.16741876218039364,
    "timesteps": 157388028,
    "learntime": 0.13320688297972083,
    "sampletime": 8.548940164968371,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 459,
    "reward_mean": 1.7428420730429925,
    "reward_max": 2.050616254684315,
    "reward_min": 1.433953411531434,
    "reward_std": 0.1474344573658999,
    "timesteps": 157748748,
    "learntime": 0.15880286507308483,
    "sampletime": 8.483024087967351,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 460,
    "reward_mean": 1.7896104905219028,
    "reward_max": 2.111802679428805,
    "reward_min": 1.4607581941368546,
    "reward_std": 0.13276236387063706,
    "timesteps": 158109468,
    "learntime": 0.12198500195518136,
    "sampletime": 8.49852656503208,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 461,
    "reward_mean": 1.4097021197821433,
    "reward_max": 2.1056022373368504,
    "reward_min": -7.503513376637731,
    "reward_std": 1.9127744819166772,
    "timesteps": 158468988,
    "learntime": 0.19485527696087956,
    "sampletime": 8.517194752115756,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 462,
    "reward_mean": 1.778207541638975,
    "reward_max": 2.1376220862430517,
    "reward_min": 1.498562401446342,
    "reward_std": 0.1397409378577121,
    "timesteps": 158829708,
    "learntime": 0.12562206899747252,
    "sampletime": 8.639274257933721,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 463,
    "reward_mean": 1.8188944253771548,
    "reward_max": 2.1859164626882586,
    "reward_min": 1.2764960576243898,
    "reward_std": 0.16235409315222102,
    "timesteps": 159190428,
    "learntime": 0.16859451704658568,
    "sampletime": 8.506745524005964,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 464,
    "reward_mean": 1.8275005535324242,
    "reward_max": 2.2510932245527813,
    "reward_min": 1.4414694875471663,
    "reward_std": 0.17832275942769216,
    "timesteps": 159551148,
    "learntime": 0.12867211899720132,
    "sampletime": 8.662169745191932,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 465,
    "reward_mean": 1.3667356814374885,
    "reward_max": 2.2085381346979456,
    "reward_min": -15.903266705064611,
    "reward_std": 2.3970690602836187,
    "timesteps": 159910911,
    "learntime": 0.19330719904974103,
    "sampletime": 8.49902403098531,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 466,
    "reward_mean": 1.8168252235084017,
    "reward_max": 2.13625103998823,
    "reward_min": 1.4140107380790679,
    "reward_std": 0.12599998633219522,
    "timesteps": 160271631,
    "learntime": 0.12495241081342101,
    "sampletime": 8.503250529058278,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 467,
    "reward_mean": 1.7955566990722156,
    "reward_max": 2.109736104252407,
    "reward_min": 1.5434424369284665,
    "reward_std": 0.1368372733184981,
    "timesteps": 160632351,
    "learntime": 0.17349472711794078,
    "sampletime": 8.591371845919639,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 468,
    "reward_mean": 1.8293504842551378,
    "reward_max": 2.10118275741878,
    "reward_min": 1.544750219493198,
    "reward_std": 0.13719382710833938,
    "timesteps": 160993071,
    "learntime": 0.11871915683150291,
    "sampletime": 8.579900664044544,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 469,
    "reward_mean": 1.8778770609380238,
    "reward_max": 2.3162890974181747,
    "reward_min": 1.623021091822725,
    "reward_std": 0.1498032398769382,
    "timesteps": 161353791,
    "learntime": 0.19000016408972442,
    "sampletime": 8.517424657009542,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 470,
    "reward_mean": 1.4016746155533955,
    "reward_max": 2.104175203436169,
    "reward_min": -7.473362346154653,
    "reward_std": 1.873024801088861,
    "timesteps": 161713206,
    "learntime": 0.12407747702673078,
    "sampletime": 8.535760229919106,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 471,
    "reward_mean": 1.782512046509003,
    "reward_max": 2.110082622303292,
    "reward_min": 1.4295693035519668,
    "reward_std": 0.14038393326305404,
    "timesteps": 162073926,
    "learntime": 0.1885042330250144,
    "sampletime": 8.636234782868996,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 472,
    "reward_mean": 1.8520899521489977,
    "reward_max": 2.2463380673976943,
    "reward_min": 1.4995180649778097,
    "reward_std": 0.14833830128109535,
    "timesteps": 162434646,
    "learntime": 0.12369660288095474,
    "sampletime": 8.50502669881098,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 473,
    "reward_mean": 1.401428019675265,
    "reward_max": 2.203326963789546,
    "reward_min": -7.223873628966623,
    "reward_std": 1.8146264335642541,
    "timesteps": 162794283,
    "learntime": 0.16614789911545813,
    "sampletime": 8.577984302071854,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 474,
    "reward_mean": 1.8250116830621081,
    "reward_max": 2.233803696535888,
    "reward_min": 1.4864779343751577,
    "reward_std": 0.14055470933200367,
    "timesteps": 163155003,
    "learntime": 0.12506879004649818,
    "sampletime": 8.482794957933947,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 475,
    "reward_mean": 1.85322679508341,
    "reward_max": 2.121467697545248,
    "reward_min": 1.4528382957285013,
    "reward_std": 0.147042080301814,
    "timesteps": 163515723,
    "learntime": 0.17894094996154308,
    "sampletime": 8.68049112893641,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 476,
    "reward_mean": 1.9211431174990588,
    "reward_max": 2.2423829510161215,
    "reward_min": 1.5954464781812419,
    "reward_std": 0.15358195971210511,
    "timesteps": 163876443,
    "learntime": 0.129455653950572,
    "sampletime": 8.593654511030763,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 477,
    "reward_mean": 1.8696755680294357,
    "reward_max": 2.286012944377335,
    "reward_min": 1.5007142786776184,
    "reward_std": 0.16694269800381908,
    "timesteps": 164237163,
    "learntime": 0.1632466169539839,
    "sampletime": 8.564277786994353,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 478,
    "reward_mean": 1.8281700456012497,
    "reward_max": 2.210022566976309,
    "reward_min": 1.4159469675579712,
    "reward_std": 0.1558844893687174,
    "timesteps": 164597883,
    "learntime": 0.12236122298054397,
    "sampletime": 8.617687122197822,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 479,
    "reward_mean": 1.810080919247025,
    "reward_max": 2.227132198155029,
    "reward_min": 1.4872394617308244,
    "reward_std": 0.15340233483598065,
    "timesteps": 164958603,
    "learntime": 0.1642542420886457,
    "sampletime": 8.530139858834445,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 480,
    "reward_mean": 1.8511791737161771,
    "reward_max": 2.290092264309128,
    "reward_min": 1.475635596829102,
    "reward_std": 0.14201549119920023,
    "timesteps": 165319323,
    "learntime": 0.13260396104305983,
    "sampletime": 8.491038060048595,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 481,
    "reward_mean": 1.8280128215431666,
    "reward_max": 2.1808516951701162,
    "reward_min": 1.4684517388639913,
    "reward_std": 0.152729713338867,
    "timesteps": 165680043,
    "learntime": 0.18126750504598022,
    "sampletime": 8.528024100000039,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 482,
    "reward_mean": 1.8843841867893,
    "reward_max": 2.1670886905786637,
    "reward_min": 1.6544579121885652,
    "reward_std": 0.11457614541889387,
    "timesteps": 166040763,
    "learntime": 0.12095172191038728,
    "sampletime": 8.574882172979414,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 483,
    "reward_mean": 1.7978700031003254,
    "reward_max": 2.1748136166865533,
    "reward_min": 1.3546638840590735,
    "reward_std": 0.15752044448569064,
    "timesteps": 166401483,
    "learntime": 0.18102116184309125,
    "sampletime": 8.670217730104923,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 484,
    "reward_mean": 1.7570654181795993,
    "reward_max": 2.13420245845301,
    "reward_min": 1.4691390946981917,
    "reward_std": 0.1420261557847097,
    "timesteps": 166762203,
    "learntime": 0.13441467308439314,
    "sampletime": 8.509345327038318,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 485,
    "reward_mean": 1.8488415417684907,
    "reward_max": 2.301179449939145,
    "reward_min": 1.3695862981857658,
    "reward_std": 0.19247410409665436,
    "timesteps": 167122923,
    "learntime": 0.16897144494578242,
    "sampletime": 8.50297079095617,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 486,
    "reward_mean": 1.7868766193703878,
    "reward_max": 2.069314354320843,
    "reward_min": 1.4561059711588415,
    "reward_std": 0.15283999752122454,
    "timesteps": 167483643,
    "learntime": 0.1346371618565172,
    "sampletime": 8.49530788208358,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 487,
    "reward_mean": 1.8164716932284304,
    "reward_max": 2.3001071137171487,
    "reward_min": 1.4376345995697168,
    "reward_std": 0.17539414836581146,
    "timesteps": 167844363,
    "learntime": 0.1890070280060172,
    "sampletime": 8.55157014890574,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 488,
    "reward_mean": 1.8668974017899107,
    "reward_max": 2.1360869117973693,
    "reward_min": 1.5700874266807303,
    "reward_std": 0.1404919088027862,
    "timesteps": 168205083,
    "learntime": 0.13268178910948336,
    "sampletime": 8.511333553120494,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 489,
    "reward_mean": 1.8021289093602748,
    "reward_max": 2.1223643366313545,
    "reward_min": 1.4137340645062368,
    "reward_std": 0.15778417611764836,
    "timesteps": 168565803,
    "learntime": 0.18204858200624585,
    "sampletime": 8.515110024018213,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 490,
    "reward_mean": 1.7803308604972592,
    "reward_max": 2.13441148689228,
    "reward_min": 1.2084462635684732,
    "reward_std": 0.15277105029984825,
    "timesteps": 168926523,
    "learntime": 0.13170315884053707,
    "sampletime": 8.66461332817562,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 491,
    "reward_mean": 1.7977632417432763,
    "reward_max": 2.2046117741388787,
    "reward_min": 1.443112694000414,
    "reward_std": 0.15308476184142067,
    "timesteps": 169287243,
    "learntime": 0.18253201083280146,
    "sampletime": 8.541204450186342,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 492,
    "reward_mean": 1.817590240614813,
    "reward_max": 2.2663486189364117,
    "reward_min": 1.5271812274182166,
    "reward_std": 0.1658006706442021,
    "timesteps": 169647963,
    "learntime": 0.12155478610657156,
    "sampletime": 8.509503668174148,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 493,
    "reward_mean": 1.7647961530967726,
    "reward_max": 2.162299499889326,
    "reward_min": 1.5208176929648296,
    "reward_std": 0.15567163600947273,
    "timesteps": 170008683,
    "learntime": 0.18516957690007985,
    "sampletime": 8.51239857985638,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 494,
    "reward_mean": 1.8721326383080117,
    "reward_max": 2.333666788759836,
    "reward_min": 1.2960885731606828,
    "reward_std": 0.18390536132436514,
    "timesteps": 170369403,
    "learntime": 0.13697673100978136,
    "sampletime": 8.492112227948382,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 495,
    "reward_mean": 1.8618201011941369,
    "reward_max": 2.289849747277469,
    "reward_min": 1.4973166779840723,
    "reward_std": 0.1692365710698551,
    "timesteps": 170730123,
    "learntime": 0.18598597194068134,
    "sampletime": 8.499333551852033,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 496,
    "reward_mean": 1.8085360566963322,
    "reward_max": 2.1079808090086725,
    "reward_min": 1.321306196500008,
    "reward_std": 0.1838485315835729,
    "timesteps": 171090843,
    "learntime": 0.13044080697000027,
    "sampletime": 8.573735518148169,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 497,
    "reward_mean": 1.8699657573504873,
    "reward_max": 2.153585511399076,
    "reward_min": 1.4666471201785334,
    "reward_std": 0.1361496973740807,
    "timesteps": 171451563,
    "learntime": 0.1772122229449451,
    "sampletime": 8.64454089407809,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 498,
    "reward_mean": 1.4178875171065197,
    "reward_max": 2.2136277307149443,
    "reward_min": -7.993118378354918,
    "reward_std": 1.9751612449133702,
    "timesteps": 171811230,
    "learntime": 0.13962270296178758,
    "sampletime": 8.58373475400731,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 499,
    "reward_mean": 1.0178577964429576,
    "reward_max": 2.306407309218128,
    "reward_min": -7.698079907582286,
    "reward_std": 2.6135581155783045,
    "timesteps": 172169844,
    "learntime": 0.17541776108555496,
    "sampletime": 8.454011118039489,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 500,
    "reward_mean": 1.3196729052939071,
    "reward_max": 2.0734628964547097,
    "reward_min": -8.087060807449182,
    "reward_std": 2.025332949636949,
    "timesteps": 172529511,
    "learntime": 0.1293613889720291,
    "sampletime": 8.504015240818262,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 501,
    "reward_mean": 1.8818471483296513,
    "reward_max": 2.2343020341200304,
    "reward_min": 1.5218421292374822,
    "reward_std": 0.17385927658413178,
    "timesteps": 172890231,
    "learntime": 0.19157707900740206,
    "sampletime": 8.712695226073265,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 502,
    "reward_mean": 1.8240125569797303,
    "reward_max": 2.0798442504425156,
    "reward_min": 1.5555511592661537,
    "reward_std": 0.11847445159325345,
    "timesteps": 173250951,
    "learntime": 0.12490772898308933,
    "sampletime": 8.528515311190858,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 503,
    "reward_mean": 1.806364002424136,
    "reward_max": 2.2294811586422507,
    "reward_min": 1.4437104402415082,
    "reward_std": 0.14247364255918943,
    "timesteps": 173611671,
    "learntime": 0.18849630001932383,
    "sampletime": 8.577819658908993,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 504,
    "reward_mean": 1.8038551053363676,
    "reward_max": 2.1861020065173764,
    "reward_min": 1.4265758041504075,
    "reward_std": 0.16391464363503655,
    "timesteps": 173972391,
    "learntime": 0.12446496705524623,
    "sampletime": 8.582450755871832,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 505,
    "reward_mean": 1.7997741936959284,
    "reward_max": 1.9847528272393062,
    "reward_min": 1.4034213740075423,
    "reward_std": 0.12715749430752835,
    "timesteps": 174333111,
    "learntime": 0.17857482400722802,
    "sampletime": 8.512321815127507,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 506,
    "reward_mean": 1.8451063008846342,
    "reward_max": 2.2372338625992216,
    "reward_min": 1.5263290163200098,
    "reward_std": 0.1441513564456978,
    "timesteps": 174693831,
    "learntime": 0.12999599101021886,
    "sampletime": 8.55851968494244,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 507,
    "reward_mean": 1.8485748800411614,
    "reward_max": 2.186918554709388,
    "reward_min": 1.4927486772684242,
    "reward_std": 0.149076682257431,
    "timesteps": 175054551,
    "learntime": 0.17859241692349315,
    "sampletime": 8.542808071943,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 508,
    "reward_mean": 1.747396216201353,
    "reward_max": 2.1234326597283744,
    "reward_min": 1.4498371344860468,
    "reward_std": 0.13037661722275917,
    "timesteps": 175415271,
    "learntime": 0.12803742103278637,
    "sampletime": 8.614890206838027,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 509,
    "reward_mean": 1.7972126026485074,
    "reward_max": 2.2684678806161327,
    "reward_min": 1.3888272711880143,
    "reward_std": 0.1660197284755515,
    "timesteps": 175775991,
    "learntime": 0.17965277004987001,
    "sampletime": 8.506991004105657,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 510,
    "reward_mean": 1.76935713293978,
    "reward_max": 2.2026202888695416,
    "reward_min": 1.4460011590792499,
    "reward_std": 0.12987037182792205,
    "timesteps": 176136711,
    "learntime": 0.13327706698328257,
    "sampletime": 8.626318919006735,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 511,
    "reward_mean": 1.7743896898016598,
    "reward_max": 2.1530705094161044,
    "reward_min": 1.2907435277752042,
    "reward_std": 0.15439068470373388,
    "timesteps": 176497431,
    "learntime": 0.16824369016103446,
    "sampletime": 8.550682709086686,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 512,
    "reward_mean": 1.350377883111375,
    "reward_max": 2.0699954428780583,
    "reward_min": -7.011352470172853,
    "reward_std": 1.7858881462330893,
    "timesteps": 176857173,
    "learntime": 0.13380877603776753,
    "sampletime": 8.557365779066458,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 513,
    "reward_mean": 1.7586957592185377,
    "reward_max": 2.2445867663834966,
    "reward_min": 1.2841735158934047,
    "reward_std": 0.1693027405478468,
    "timesteps": 177217893,
    "learntime": 0.17449346603825688,
    "sampletime": 8.585939107928425,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 514,
    "reward_mean": 1.8335661916262767,
    "reward_max": 2.1245368173642216,
    "reward_min": 1.4721927256186682,
    "reward_std": 0.13806126269470118,
    "timesteps": 177578613,
    "learntime": 0.13524443400092423,
    "sampletime": 8.596632226835936,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 515,
    "reward_mean": 1.817045917725433,
    "reward_max": 2.2140929346981744,
    "reward_min": 1.4498941650321757,
    "reward_std": 0.16066389045708074,
    "timesteps": 177939333,
    "learntime": 0.17397643392905593,
    "sampletime": 8.528100006049499,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 516,
    "reward_mean": 1.7957562863631984,
    "reward_max": 2.153690760440164,
    "reward_min": 1.4016762540435788,
    "reward_std": 0.13819279458370826,
    "timesteps": 178300053,
    "learntime": 0.12534699402749538,
    "sampletime": 8.499711177079007,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 517,
    "reward_mean": 1.8677505033022619,
    "reward_max": 2.263257668056403,
    "reward_min": 1.3831131750775947,
    "reward_std": 0.13937999608598217,
    "timesteps": 178660773,
    "learntime": 0.17890901304781437,
    "sampletime": 8.60214183689095,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 518,
    "reward_mean": 1.8439516761578285,
    "reward_max": 2.180724747913901,
    "reward_min": 1.513145460923566,
    "reward_std": 0.1444145230197212,
    "timesteps": 179021493,
    "learntime": 0.12124323192983866,
    "sampletime": 8.604178074048832,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 519,
    "reward_mean": 1.866554931397211,
    "reward_max": 2.097604609621953,
    "reward_min": 1.560181332278361,
    "reward_std": 0.12102622170460198,
    "timesteps": 179382213,
    "learntime": 0.18477410590276122,
    "sampletime": 8.584784780163318,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 520,
    "reward_mean": 1.36227056996729,
    "reward_max": 2.090805250047937,
    "reward_min": -7.162186907099872,
    "reward_std": 1.8726630717490313,
    "timesteps": 179741799,
    "learntime": 0.12890507094562054,
    "sampletime": 8.477555355988443,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 521,
    "reward_mean": 1.799478004051339,
    "reward_max": 2.1413932506129054,
    "reward_min": 1.4782635513546543,
    "reward_std": 0.1586454802284001,
    "timesteps": 180102519,
    "learntime": 0.17666873382404447,
    "sampletime": 8.490216481965035,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 522,
    "reward_mean": 1.7639351053491896,
    "reward_max": 2.0603855711788923,
    "reward_min": 1.2489570835540555,
    "reward_std": 0.15853145874859428,
    "timesteps": 180463239,
    "learntime": 0.13274493697099388,
    "sampletime": 8.578010705066845,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 523,
    "reward_mean": 1.4171179814337918,
    "reward_max": 2.283672785481691,
    "reward_min": -7.2628535076827685,
    "reward_std": 1.8491079711651457,
    "timesteps": 180822714,
    "learntime": 0.17313762800768018,
    "sampletime": 8.458381999051198,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 524,
    "reward_mean": 1.407888726781409,
    "reward_max": 2.322820790965729,
    "reward_min": -6.979638167388853,
    "reward_std": 1.849742253987321,
    "timesteps": 181182258,
    "learntime": 0.11750942491926253,
    "sampletime": 8.56481044110842,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 525,
    "reward_mean": 1.8130337455192538,
    "reward_max": 2.062382125232197,
    "reward_min": 1.4456149966272518,
    "reward_std": 0.13544212227272134,
    "timesteps": 181542978,
    "learntime": 0.17800994496792555,
    "sampletime": 8.591160671785474,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 526,
    "reward_mean": 1.8229119874649249,
    "reward_max": 2.3072138941563662,
    "reward_min": 1.3654366164555514,
    "reward_std": 0.1567497902201478,
    "timesteps": 181903698,
    "learntime": 0.13279903889633715,
    "sampletime": 8.615329814143479,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 527,
    "reward_mean": 1.8261380693489255,
    "reward_max": 2.156739577643967,
    "reward_min": 1.4903089284251259,
    "reward_std": 0.1461981379040883,
    "timesteps": 182264418,
    "learntime": 0.18977338098920882,
    "sampletime": 8.645546702900901,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 528,
    "reward_mean": 1.8708496205744685,
    "reward_max": 2.222177024347753,
    "reward_min": 1.5178618250785332,
    "reward_std": 0.1642494729722729,
    "timesteps": 182625138,
    "learntime": 0.13431306509301066,
    "sampletime": 8.680172066902742,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 529,
    "reward_mean": 1.8302837862679533,
    "reward_max": 2.116918739479978,
    "reward_min": 1.5311853917499456,
    "reward_std": 0.14681473478991428,
    "timesteps": 182985858,
    "learntime": 0.19419762399047613,
    "sampletime": 8.538918290985748,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 530,
    "reward_mean": 1.3750238701369377,
    "reward_max": 2.155181129209163,
    "reward_min": -6.667366567559337,
    "reward_std": 1.7720349893991574,
    "timesteps": 183345672,
    "learntime": 0.12851161207072437,
    "sampletime": 8.563608950935304,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 531,
    "reward_mean": 1.2792360675909604,
    "reward_max": 1.9969467656743314,
    "reward_min": -7.740129986809654,
    "reward_std": 1.968069011335141,
    "timesteps": 183705189,
    "learntime": 0.18385305511765182,
    "sampletime": 8.559608375886455,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 532,
    "reward_mean": 1.3906447564919484,
    "reward_max": 2.2203836335166027,
    "reward_min": -7.175873991031429,
    "reward_std": 1.885219916116609,
    "timesteps": 184064751,
    "learntime": 0.1297385471407324,
    "sampletime": 8.660500654019415,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 533,
    "reward_mean": 1.7550067253207655,
    "reward_max": 2.115713277810505,
    "reward_min": 1.4583213243820465,
    "reward_std": 0.15390940257888217,
    "timesteps": 184425471,
    "learntime": 0.18836540589109063,
    "sampletime": 8.540478837909177,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 534,
    "reward_mean": 1.7705215240048862,
    "reward_max": 2.1553333320268626,
    "reward_min": 1.3176269490539907,
    "reward_std": 0.14971250892613333,
    "timesteps": 184786191,
    "learntime": 0.12829929194413126,
    "sampletime": 8.67700730706565,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 535,
    "reward_mean": 1.8573394476573295,
    "reward_max": 2.1071981018176267,
    "reward_min": 1.3212139969462315,
    "reward_std": 0.13538045372547347,
    "timesteps": 185146911,
    "learntime": 0.17232422903180122,
    "sampletime": 8.51481930888258,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 536,
    "reward_mean": 1.827741415085882,
    "reward_max": 2.1791423563117815,
    "reward_min": 1.4860780439586505,
    "reward_std": 0.15138248380045616,
    "timesteps": 185507631,
    "learntime": 0.1231690610293299,
    "sampletime": 8.599704073974863,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 537,
    "reward_mean": 1.842436004405765,
    "reward_max": 2.2189814803687913,
    "reward_min": 1.3113863777482122,
    "reward_std": 0.1681775011890989,
    "timesteps": 185868351,
    "learntime": 0.16370402998290956,
    "sampletime": 8.621370542095974,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 538,
    "reward_mean": 1.7466366652581553,
    "reward_max": 2.2876586101651104,
    "reward_min": 1.3709797800159622,
    "reward_std": 0.1499984564915846,
    "timesteps": 186229071,
    "learntime": 0.13294903305359185,
    "sampletime": 8.420110254082829,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 539,
    "reward_mean": 1.7102596577069082,
    "reward_max": 2.064197569831526,
    "reward_min": 1.315151706644839,
    "reward_std": 0.15556984505175772,
    "timesteps": 186589791,
    "learntime": 0.17876068502664566,
    "sampletime": 8.56658726092428,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 540,
    "reward_mean": 1.737550072796779,
    "reward_max": 2.0297885416181396,
    "reward_min": 1.4059494611997643,
    "reward_std": 0.1311506782370034,
    "timesteps": 186950511,
    "learntime": 0.13257738295942545,
    "sampletime": 8.727946936152875,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 541,
    "reward_mean": 1.8605642996715348,
    "reward_max": 2.1700691476862874,
    "reward_min": 1.4242824089746537,
    "reward_std": 0.16456860298302048,
    "timesteps": 187311231,
    "learntime": 0.18848801590502262,
    "sampletime": 8.587510674027726,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 542,
    "reward_mean": 1.8037564945336229,
    "reward_max": 2.2564927880885057,
    "reward_min": 1.4999679426958485,
    "reward_std": 0.1451115486302064,
    "timesteps": 187671951,
    "learntime": 0.14321096800267696,
    "sampletime": 8.482196687953547,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 543,
    "reward_mean": 1.4283338091693367,
    "reward_max": 2.058846670428683,
    "reward_min": -7.263147736137568,
    "reward_std": 1.900195213530468,
    "timesteps": 188031453,
    "learntime": 0.1767153108958155,
    "sampletime": 8.481344628147781,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 544,
    "reward_mean": 1.7948914905573496,
    "reward_max": 2.0913258142124174,
    "reward_min": 1.3267504242054782,
    "reward_std": 0.13999035525394612,
    "timesteps": 188392173,
    "learntime": 0.12401579297147691,
    "sampletime": 8.59989147610031,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 545,
    "reward_mean": 1.8281570643112093,
    "reward_max": 2.3676010775351144,
    "reward_min": 1.4728223870783508,
    "reward_std": 0.16070342700306436,
    "timesteps": 188752893,
    "learntime": 0.18289606785401702,
    "sampletime": 8.636941594071686,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 546,
    "reward_mean": 1.863940393723191,
    "reward_max": 2.085293580390773,
    "reward_min": 1.3667481290908492,
    "reward_std": 0.13366711973991882,
    "timesteps": 189113613,
    "learntime": 0.1289571588858962,
    "sampletime": 8.541504762135446,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 547,
    "reward_mean": 1.8645256577431595,
    "reward_max": 2.182993901489073,
    "reward_min": 1.449116940785833,
    "reward_std": 0.1565674061407851,
    "timesteps": 189474333,
    "learntime": 0.1812551231123507,
    "sampletime": 8.5071869881358,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 548,
    "reward_mean": 1.8552031783645573,
    "reward_max": 2.299483663859338,
    "reward_min": 1.4631063025380044,
    "reward_std": 0.19260803425656545,
    "timesteps": 189835053,
    "learntime": 0.13536086585372686,
    "sampletime": 8.581593821989372,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 549,
    "reward_mean": 1.8690327316942352,
    "reward_max": 2.123020745469888,
    "reward_min": 1.480781696371469,
    "reward_std": 0.1512539214523535,
    "timesteps": 190195773,
    "learntime": 0.17354383110068738,
    "sampletime": 8.55762619082816,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 550,
    "reward_mean": 1.8431514767326407,
    "reward_max": 2.239069471707224,
    "reward_min": 1.5495980523895296,
    "reward_std": 0.15752820085201555,
    "timesteps": 190556493,
    "learntime": 0.13057449995540082,
    "sampletime": 8.63745359214954,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 551,
    "reward_mean": 1.7323594218380722,
    "reward_max": 1.9761503499325799,
    "reward_min": 1.3445435219204436,
    "reward_std": 0.1311134165909926,
    "timesteps": 190917213,
    "learntime": 0.19216836290434003,
    "sampletime": 8.5939004230313,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 552,
    "reward_mean": 1.3006882763212644,
    "reward_max": 2.050990708814367,
    "reward_min": -7.152826697248122,
    "reward_std": 1.8737736908188551,
    "timesteps": 191276901,
    "learntime": 0.13515651901252568,
    "sampletime": 8.635291702812538,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 553,
    "reward_mean": 1.7801023509598495,
    "reward_max": 2.17444339645744,
    "reward_min": 1.40814500749746,
    "reward_std": 0.14863676133844708,
    "timesteps": 191637621,
    "learntime": 0.172267802990973,
    "sampletime": 8.61432354687713,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 554,
    "reward_mean": 1.7577843220150433,
    "reward_max": 2.116769027307092,
    "reward_min": 1.3987854451277375,
    "reward_std": 0.15766925999197953,
    "timesteps": 191998341,
    "learntime": 0.1394565710797906,
    "sampletime": 8.526997366221622,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 555,
    "reward_mean": 1.7565487455300064,
    "reward_max": 2.042809523726727,
    "reward_min": 1.428896218271828,
    "reward_std": 0.13912574253683269,
    "timesteps": 192359061,
    "learntime": 0.18336361600086093,
    "sampletime": 8.539995986036956,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 556,
    "reward_mean": 1.8258746603328118,
    "reward_max": 2.1811185801264115,
    "reward_min": 1.5025472879325101,
    "reward_std": 0.14485581488731122,
    "timesteps": 192719781,
    "learntime": 0.1280398650560528,
    "sampletime": 8.541995302774012,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 557,
    "reward_mean": 1.7972938688975146,
    "reward_max": 2.1730216523971033,
    "reward_min": 1.394989098972553,
    "reward_std": 0.15194100965914914,
    "timesteps": 193080501,
    "learntime": 0.16427276795729995,
    "sampletime": 8.549123019911349,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 558,
    "reward_mean": 1.8394147455754575,
    "reward_max": 2.194544048896975,
    "reward_min": 1.472366637558892,
    "reward_std": 0.146817466929172,
    "timesteps": 193441221,
    "learntime": 0.1249001850374043,
    "sampletime": 8.508165747858584,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 559,
    "reward_mean": 1.7884872050728786,
    "reward_max": 2.3377856274495206,
    "reward_min": 1.4165494798928362,
    "reward_std": 0.19003781799127334,
    "timesteps": 193801941,
    "learntime": 0.1872749871108681,
    "sampletime": 8.590797940036282,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 560,
    "reward_mean": 1.413734166596036,
    "reward_max": 2.256990612690004,
    "reward_min": -6.960833976161669,
    "reward_std": 1.837812784482014,
    "timesteps": 194161599,
    "learntime": 0.122284019831568,
    "sampletime": 8.555211161961779,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 561,
    "reward_mean": 1.8226759169558084,
    "reward_max": 2.2066057348045294,
    "reward_min": 1.4633146542420754,
    "reward_std": 0.1687818314915252,
    "timesteps": 194522319,
    "learntime": 0.18259580410085618,
    "sampletime": 8.481411419808865,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 562,
    "reward_mean": 1.837132582567929,
    "reward_max": 2.1407662236809033,
    "reward_min": 1.4602482907022476,
    "reward_std": 0.14655189532446053,
    "timesteps": 194883039,
    "learntime": 0.1302973278798163,
    "sampletime": 8.501232462003827,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 563,
    "reward_mean": 1.3661600794460558,
    "reward_max": 2.057399860342732,
    "reward_min": -6.972427672244411,
    "reward_std": 1.7649550737985422,
    "timesteps": 195242565,
    "learntime": 0.18595895287580788,
    "sampletime": 8.597635743906721,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 564,
    "reward_mean": 1.4211492927943854,
    "reward_max": 2.1663269713965474,
    "reward_min": -7.422871255183552,
    "reward_std": 1.9049693124720861,
    "timesteps": 195602064,
    "learntime": 0.13039177702739835,
    "sampletime": 8.470312444027513,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 565,
    "reward_mean": 1.8016967499879841,
    "reward_max": 2.094044535590164,
    "reward_min": 1.461604949166277,
    "reward_std": 0.13867406017604475,
    "timesteps": 195962784,
    "learntime": 0.18780612596310675,
    "sampletime": 8.487699441844597,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 566,
    "reward_mean": 1.4646894391405385,
    "reward_max": 2.257415161024913,
    "reward_min": -6.888808419956178,
    "reward_std": 1.80974674421337,
    "timesteps": 196322475,
    "learntime": 0.13152015581727028,
    "sampletime": 8.684684378094971,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 567,
    "reward_mean": 0.6175466960413704,
    "reward_max": 2.1857806722594706,
    "reward_min": -7.538074975596942,
    "reward_std": 3.0498629923385594,
    "timesteps": 196680009,
    "learntime": 0.18682894809171557,
    "sampletime": 8.51291049295105,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 568,
    "reward_mean": 1.4102678518833969,
    "reward_max": 2.2991150991601303,
    "reward_min": -6.962859036097532,
    "reward_std": 1.8067912746550394,
    "timesteps": 197039700,
    "learntime": 0.13720919890329242,
    "sampletime": 8.581515023019165,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 569,
    "reward_mean": 1.7775847191692637,
    "reward_max": 2.1448026427745117,
    "reward_min": 1.3236550408101786,
    "reward_std": 0.1740993279477389,
    "timesteps": 197400420,
    "learntime": 0.16170661500655115,
    "sampletime": 8.583186594070867,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 570,
    "reward_mean": 1.4497108988446967,
    "reward_max": 2.1819803650938714,
    "reward_min": -6.9238067751210846,
    "reward_std": 1.8392959305632766,
    "timesteps": 197760087,
    "learntime": 0.1363870231434703,
    "sampletime": 8.554108537966385,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 571,
    "reward_mean": 1.3961602109291102,
    "reward_max": 2.088471622203036,
    "reward_min": -7.109125728112168,
    "reward_std": 1.7742011479998463,
    "timesteps": 198119754,
    "learntime": 0.18051883997395635,
    "sampletime": 8.44557963986881,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 572,
    "reward_mean": 1.754554734242949,
    "reward_max": 2.138685429633671,
    "reward_min": 1.2748194795285288,
    "reward_std": 0.17586841927192648,
    "timesteps": 198480474,
    "learntime": 0.12771791010163724,
    "sampletime": 8.53529862081632,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 573,
    "reward_mean": 1.8322923514299203,
    "reward_max": 2.27569055105524,
    "reward_min": 1.4359902940817502,
    "reward_std": 0.16104116353696032,
    "timesteps": 198841194,
    "learntime": 0.16539859399199486,
    "sampletime": 8.677111571887508,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 574,
    "reward_mean": 1.7879167645083547,
    "reward_max": 2.1477234064994293,
    "reward_min": 1.329282497098159,
    "reward_std": 0.15760253473374283,
    "timesteps": 199201914,
    "learntime": 0.12825640197843313,
    "sampletime": 8.538277701940387,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 575,
    "reward_mean": 1.8015297693163086,
    "reward_max": 2.192535853230055,
    "reward_min": 1.4015319938806678,
    "reward_std": 0.16077332964461988,
    "timesteps": 199562634,
    "learntime": 0.1747529641725123,
    "sampletime": 8.579332223860547,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 576,
    "reward_mean": 1.008214390955045,
    "reward_max": 2.1924991815096933,
    "reward_min": -7.1870841298174755,
    "reward_std": 2.574272841429639,
    "timesteps": 199921479,
    "learntime": 0.13072016509249806,
    "sampletime": 8.514160208869725,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 577,
    "reward_mean": 1.8954752095130762,
    "reward_max": 2.2496917006475,
    "reward_min": 1.5885087646668332,
    "reward_std": 0.14306425139287396,
    "timesteps": 200282199,
    "learntime": 0.17016864009201527,
    "sampletime": 8.607272084103897,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 578,
    "reward_mean": 1.892648842691131,
    "reward_max": 2.2281451189159633,
    "reward_min": 1.5695924089963982,
    "reward_std": 0.1485045201980887,
    "timesteps": 200642919,
    "learntime": 0.1253230799920857,
    "sampletime": 8.549577218014747,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 579,
    "reward_mean": 1.8366784154226052,
    "reward_max": 2.1883323178697136,
    "reward_min": 1.5095164407111652,
    "reward_std": 0.1462902868516682,
    "timesteps": 201003639,
    "learntime": 0.1756567119155079,
    "sampletime": 8.550647462019697,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 580,
    "reward_mean": 1.3845556953717633,
    "reward_max": 2.225006548985909,
    "reward_min": -7.140986553559111,
    "reward_std": 1.8361305630355118,
    "timesteps": 201363159,
    "learntime": 0.13387999101541936,
    "sampletime": 8.596941360039636,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 581,
    "reward_mean": 1.8058596796438635,
    "reward_max": 2.2008765641965304,
    "reward_min": 1.466373751158681,
    "reward_std": 0.14146710675787016,
    "timesteps": 201723879,
    "learntime": 0.1933739702217281,
    "sampletime": 8.509258528007194,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 582,
    "reward_mean": 1.781964006938837,
    "reward_max": 2.0982660866357015,
    "reward_min": 1.4669575679452234,
    "reward_std": 0.1553936002895613,
    "timesteps": 202084599,
    "learntime": 0.13298266590572894,
    "sampletime": 8.581395807908848,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 583,
    "reward_mean": 1.4416566408543847,
    "reward_max": 2.3578147153523505,
    "reward_min": -14.630246362450835,
    "reward_std": 2.315370703760151,
    "timesteps": 202444149,
    "learntime": 0.17894797795452178,
    "sampletime": 8.642715706955642,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 584,
    "reward_mean": 1.7705204877615544,
    "reward_max": 2.162864464522112,
    "reward_min": 1.434524084804718,
    "reward_std": 0.13048468424428789,
    "timesteps": 202804869,
    "learntime": 0.1297090440057218,
    "sampletime": 8.548366446048021,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 585,
    "reward_mean": 1.7630484868588412,
    "reward_max": 2.1454979939612007,
    "reward_min": 1.4769915848155468,
    "reward_std": 0.14790785313708643,
    "timesteps": 203165589,
    "learntime": 0.1865622268524021,
    "sampletime": 8.61428440711461,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 586,
    "reward_mean": 1.7855164740403655,
    "reward_max": 2.2059202744999427,
    "reward_min": 1.454967169239267,
    "reward_std": 0.15141963101221395,
    "timesteps": 203526309,
    "learntime": 0.12639965303242207,
    "sampletime": 8.591559960972518,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 587,
    "reward_mean": 1.7808493419334122,
    "reward_max": 2.189927950999732,
    "reward_min": 1.4658882226371601,
    "reward_std": 0.1146770861763714,
    "timesteps": 203887029,
    "learntime": 0.16754811606369913,
    "sampletime": 8.544739191886038,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 588,
    "reward_mean": 1.8563748716148196,
    "reward_max": 2.2213990671787704,
    "reward_min": 1.4231585233523416,
    "reward_std": 0.16493657180379223,
    "timesteps": 204247749,
    "learntime": 0.1412857691757381,
    "sampletime": 8.56601735111326,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 589,
    "reward_mean": 1.8248577348528618,
    "reward_max": 2.16224907658276,
    "reward_min": 1.4190584756857285,
    "reward_std": 0.17165391815583453,
    "timesteps": 204608469,
    "learntime": 0.17430719593539834,
    "sampletime": 8.671654936857522,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 590,
    "reward_mean": 1.3847799215941015,
    "reward_max": 2.096051202945199,
    "reward_min": -15.884695450131515,
    "reward_std": 2.4294790793391687,
    "timesteps": 204968196,
    "learntime": 0.13502265000715852,
    "sampletime": 8.539151431061327,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 591,
    "reward_mean": 1.7946121196102334,
    "reward_max": 2.225225452227856,
    "reward_min": 1.4508067437228875,
    "reward_std": 0.1568430787033212,
    "timesteps": 205328916,
    "learntime": 0.18002195795997977,
    "sampletime": 8.538590156007558,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 592,
    "reward_mean": 1.8630081639420697,
    "reward_max": 2.2468078043711475,
    "reward_min": 1.5062928490480034,
    "reward_std": 0.17100415961990836,
    "timesteps": 205689636,
    "learntime": 0.13306083297356963,
    "sampletime": 8.660919680958614,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 593,
    "reward_mean": 1.79171542058019,
    "reward_max": 2.340829390713195,
    "reward_min": 1.359795588437749,
    "reward_std": 0.18984416403367954,
    "timesteps": 206050356,
    "learntime": 0.18577154306694865,
    "sampletime": 8.537720734020695,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 594,
    "reward_mean": 1.839555797240433,
    "reward_max": 2.3399020059571,
    "reward_min": 1.3334633031627148,
    "reward_std": 0.17512822095297395,
    "timesteps": 206411076,
    "learntime": 0.1285327230580151,
    "sampletime": 8.50697410106659,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 595,
    "reward_mean": 1.8840383732827486,
    "reward_max": 2.2990537173818875,
    "reward_min": 1.5868347570173078,
    "reward_std": 0.148546903319008,
    "timesteps": 206771796,
    "learntime": 0.17792675993405282,
    "sampletime": 8.495090061798692,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 596,
    "reward_mean": 1.9155203951800504,
    "reward_max": 2.3518206279735403,
    "reward_min": 1.5315054388713276,
    "reward_std": 0.15689630626768283,
    "timesteps": 207132516,
    "learntime": 0.13093196391128004,
    "sampletime": 8.51270632701926,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 597,
    "reward_mean": 1.823437665068632,
    "reward_max": 2.114750667423128,
    "reward_min": 1.4472254150605266,
    "reward_std": 0.16721069262054727,
    "timesteps": 207493236,
    "learntime": 0.20086617791093886,
    "sampletime": 8.562820916064084,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 598,
    "reward_mean": 1.8408148777137376,
    "reward_max": 2.2313513939481027,
    "reward_min": 1.5192180222533551,
    "reward_std": 0.13245411223717304,
    "timesteps": 207853956,
    "learntime": 0.11830184399150312,
    "sampletime": 8.514985241927207,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 599,
    "reward_mean": 1.7625919844523867,
    "reward_max": 2.1055282786385026,
    "reward_min": 1.4278768303774967,
    "reward_std": 0.12582485989891742,
    "timesteps": 208214676,
    "learntime": 0.1864976289216429,
    "sampletime": 8.498155892826617,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 600,
    "reward_mean": 1.7752374109212172,
    "reward_max": 1.9973524682943429,
    "reward_min": 1.5489673076016388,
    "reward_std": 0.12475442724558232,
    "timesteps": 208575396,
    "learntime": 0.13016695203259587,
    "sampletime": 8.608033437049016,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 601,
    "reward_mean": 1.7487129778526078,
    "reward_max": 2.0269318158137697,
    "reward_min": 1.360617895465991,
    "reward_std": 0.1364443548925319,
    "timesteps": 208936116,
    "learntime": 0.1740981969051063,
    "sampletime": 8.544515332905576,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 602,
    "reward_mean": 1.7513469450751304,
    "reward_max": 2.0685973998695366,
    "reward_min": 1.5486715997950236,
    "reward_std": 0.13801521145382506,
    "timesteps": 209296836,
    "learntime": 0.12788097909651697,
    "sampletime": 8.454671027837321,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 603,
    "reward_mean": 1.413493387337597,
    "reward_max": 2.3313444301020345,
    "reward_min": -7.465860246123296,
    "reward_std": 1.952994344200406,
    "timesteps": 209656290,
    "learntime": 0.1331591207999736,
    "sampletime": 8.458185605006292,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 604,
    "reward_mean": 1.4612462284696668,
    "reward_max": 2.192533960894003,
    "reward_min": -7.518600518992326,
    "reward_std": 1.8964662170008995,
    "timesteps": 210015744,
    "learntime": 0.13509115995839238,
    "sampletime": 8.543165716109797,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 605,
    "reward_mean": 1.8229665996943991,
    "reward_max": 2.098810666784681,
    "reward_min": 1.4580828353443338,
    "reward_std": 0.1611727745792663,
    "timesteps": 210376464,
    "learntime": 0.17593728378415108,
    "sampletime": 8.59120398806408,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 606,
    "reward_mean": 1.7447235134285954,
    "reward_max": 2.0794458877344635,
    "reward_min": 1.401401819813392,
    "reward_std": 0.15600160357726114,
    "timesteps": 210737184,
    "learntime": 0.1270641938317567,
    "sampletime": 8.632950466126204,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 607,
    "reward_mean": 1.755988683925143,
    "reward_max": 2.049046002512719,
    "reward_min": 1.4855289468188921,
    "reward_std": 0.14416135728878854,
    "timesteps": 211097904,
    "learntime": 0.12841675709933043,
    "sampletime": 8.559813192812726,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 608,
    "reward_mean": 1.835035460543388,
    "reward_max": 2.1616671462194934,
    "reward_min": 1.4840993433187526,
    "reward_std": 0.14038003927113143,
    "timesteps": 211458624,
    "learntime": 0.13511640205979347,
    "sampletime": 8.593201895011589,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 609,
    "reward_mean": 1.8469427241836187,
    "reward_max": 2.191159961376493,
    "reward_min": 1.4674536850440987,
    "reward_std": 0.16304746982033216,
    "timesteps": 211819344,
    "learntime": 0.12766297603957355,
    "sampletime": 8.612021179171279,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 610,
    "reward_mean": 1.8057755145591277,
    "reward_max": 2.0793021655973067,
    "reward_min": 1.47845923385378,
    "reward_std": 0.13995771892073394,
    "timesteps": 212180064,
    "learntime": 0.12597425002604723,
    "sampletime": 8.4951864448376,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 611,
    "reward_mean": 1.7935608776648688,
    "reward_max": 2.242034716873825,
    "reward_min": 1.4042661483294447,
    "reward_std": 0.17164620268557124,
    "timesteps": 212540784,
    "learntime": 0.12788978009484708,
    "sampletime": 8.628819934092462,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 612,
    "reward_mean": 1.8357749487554784,
    "reward_max": 2.2785634395479426,
    "reward_min": 1.4757711728540877,
    "reward_std": 0.15973690045373692,
    "timesteps": 212901504,
    "learntime": 0.12778224283829331,
    "sampletime": 8.501362613867968,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 613,
    "reward_mean": 1.8317461322291806,
    "reward_max": 2.169506820024583,
    "reward_min": 1.5919999530923412,
    "reward_std": 0.1454522179859064,
    "timesteps": 213262224,
    "learntime": 0.129114804090932,
    "sampletime": 8.517891110153869,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 614,
    "reward_mean": 1.8988206323804027,
    "reward_max": 2.3475153649536256,
    "reward_min": 1.6341194289590613,
    "reward_std": 0.1462344866942046,
    "timesteps": 213622944,
    "learntime": 0.13356443401426077,
    "sampletime": 8.586239736992866,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 615,
    "reward_mean": 1.815399894635822,
    "reward_max": 2.3430523560029646,
    "reward_min": 1.4607398763799915,
    "reward_std": 0.17724480246993232,
    "timesteps": 213983664,
    "learntime": 0.1286012560594827,
    "sampletime": 8.523129090899602,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 616,
    "reward_mean": 1.7703503062886738,
    "reward_max": 2.1209140815190017,
    "reward_min": 1.4411182832845915,
    "reward_std": 0.14714656632841763,
    "timesteps": 214344384,
    "learntime": 0.1272437151055783,
    "sampletime": 8.546050259843469,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 617,
    "reward_mean": 1.8269237901781992,
    "reward_max": 2.117922883678338,
    "reward_min": 1.4535365634963222,
    "reward_std": 0.13234749454086248,
    "timesteps": 214705104,
    "learntime": 0.13138687913306057,
    "sampletime": 8.597257984103635,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 618,
    "reward_mean": 1.8870165164670007,
    "reward_max": 2.190286496879926,
    "reward_min": 1.5840106952977762,
    "reward_std": 0.14479602959820184,
    "timesteps": 215065824,
    "learntime": 0.1312600129749626,
    "sampletime": 8.67210514517501,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 619,
    "reward_mean": 1.9566750899555363,
    "reward_max": 2.464076336286475,
    "reward_min": 1.5233658754044528,
    "reward_std": 0.19197110568580575,
    "timesteps": 215426544,
    "learntime": 0.1305546120274812,
    "sampletime": 8.577338339062408,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 620,
    "reward_mean": 1.9036075115458826,
    "reward_max": 2.2817077470458673,
    "reward_min": 1.5959988510603018,
    "reward_std": 0.15663780078150302,
    "timesteps": 215787264,
    "learntime": 0.12214191281236708,
    "sampletime": 8.553199889138341,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 621,
    "reward_mean": 1.7757850338231445,
    "reward_max": 2.2211214632001357,
    "reward_min": 1.4897929195140005,
    "reward_std": 0.1677097650880994,
    "timesteps": 216147984,
    "learntime": 0.1315195788629353,
    "sampletime": 8.507718122098595,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 622,
    "reward_mean": 1.85021621605076,
    "reward_max": 2.225400336806405,
    "reward_min": 1.4558398920520559,
    "reward_std": 0.17786107762290582,
    "timesteps": 216508704,
    "learntime": 0.14242984494194388,
    "sampletime": 8.6212747360114,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 623,
    "reward_mean": 1.8431354090225576,
    "reward_max": 2.3180939280605823,
    "reward_min": 1.5897972570585066,
    "reward_std": 0.1361717915623311,
    "timesteps": 216869424,
    "learntime": 0.12609734502620995,
    "sampletime": 8.53373958193697,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 624,
    "reward_mean": 1.8168327893813832,
    "reward_max": 2.260832789000837,
    "reward_min": 1.450316360458433,
    "reward_std": 0.16528692507156686,
    "timesteps": 217230144,
    "learntime": 0.13061733613722026,
    "sampletime": 8.64788086200133,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 625,
    "reward_mean": 1.8058573687092547,
    "reward_max": 2.1177152233237106,
    "reward_min": 1.4479005340712503,
    "reward_std": 0.14549995264851126,
    "timesteps": 217590864,
    "learntime": 0.13086818205192685,
    "sampletime": 8.694150784052908,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 626,
    "reward_mean": 1.8206658818978747,
    "reward_max": 2.259095618175649,
    "reward_min": 1.4325950239160132,
    "reward_std": 0.15085714764770447,
    "timesteps": 217951584,
    "learntime": 0.12834407901391387,
    "sampletime": 8.533192160073668,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 627,
    "reward_mean": 1.7955287858799216,
    "reward_max": 2.378519157078256,
    "reward_min": 1.4801150876260651,
    "reward_std": 0.14798004671011725,
    "timesteps": 218312304,
    "learntime": 0.1160633151885122,
    "sampletime": 8.53468052111566,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 628,
    "reward_mean": 1.7660128994526578,
    "reward_max": 2.159029520309007,
    "reward_min": 1.4056423975747396,
    "reward_std": 0.154196575528102,
    "timesteps": 218673024,
    "learntime": 0.1308665459509939,
    "sampletime": 8.604208025150001,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 629,
    "reward_mean": 1.8015300550224183,
    "reward_max": 2.1212639859701112,
    "reward_min": 1.2771470396793563,
    "reward_std": 0.16201028941509404,
    "timesteps": 219033744,
    "learntime": 0.13386667612940073,
    "sampletime": 8.569268195191398,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 630,
    "reward_mean": 1.753569464529559,
    "reward_max": 2.07410588858395,
    "reward_min": 1.490802552842068,
    "reward_std": 0.14078956467718634,
    "timesteps": 219394464,
    "learntime": 0.13559163897298276,
    "sampletime": 8.481103751109913,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 631,
    "reward_mean": 1.7693258401897132,
    "reward_max": 2.143795381247234,
    "reward_min": 1.3951851469358738,
    "reward_std": 0.15398424222132656,
    "timesteps": 219755184,
    "learntime": 0.1314873017836362,
    "sampletime": 8.474432356888428,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 632,
    "reward_mean": 1.8295773950271697,
    "reward_max": 2.187883957868588,
    "reward_min": 1.455766958294339,
    "reward_std": 0.15321575558851933,
    "timesteps": 220115904,
    "learntime": 0.13083525095134974,
    "sampletime": 8.512709407135844,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 633,
    "reward_mean": 1.8590144685920305,
    "reward_max": 2.3429988773634887,
    "reward_min": 1.53748756487656,
    "reward_std": 0.17483356421538046,
    "timesteps": 220476624,
    "learntime": 0.1336466260254383,
    "sampletime": 8.692904411815107,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 634,
    "reward_mean": 1.9160257167053003,
    "reward_max": 2.2417602183184364,
    "reward_min": 1.6478839141006254,
    "reward_std": 0.12669674660790856,
    "timesteps": 220837344,
    "learntime": 0.13278184505179524,
    "sampletime": 8.483762361109257,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 635,
    "reward_mean": 1.4438685678887584,
    "reward_max": 2.172986847510782,
    "reward_min": -7.4709732111995,
    "reward_std": 1.922619711260903,
    "timesteps": 221196876,
    "learntime": 0.12951461388729513,
    "sampletime": 8.522247768007219,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 636,
    "reward_mean": 1.8004324259130238,
    "reward_max": 2.146739297126644,
    "reward_min": 1.4276315602368066,
    "reward_std": 0.15861497719775422,
    "timesteps": 221557596,
    "learntime": 0.13176139816641808,
    "sampletime": 8.533167142886668,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 637,
    "reward_mean": 1.7647622031458456,
    "reward_max": 2.062624563338678,
    "reward_min": 1.3613178502189693,
    "reward_std": 0.15046552184700754,
    "timesteps": 221918316,
    "learntime": 0.12201078794896603,
    "sampletime": 8.536401233868673,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 638,
    "reward_mean": 1.7702072375315554,
    "reward_max": 2.1664382998203595,
    "reward_min": 1.383094376184288,
    "reward_std": 0.16618010803126898,
    "timesteps": 222279036,
    "learntime": 0.12602328415960073,
    "sampletime": 8.536558406893164,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 639,
    "reward_mean": 1.3846498455661997,
    "reward_max": 2.195380764006224,
    "reward_min": -7.43157361686992,
    "reward_std": 1.867663809759805,
    "timesteps": 222638736,
    "learntime": 0.13484423700720072,
    "sampletime": 8.469083303119987,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 640,
    "reward_mean": 1.788251751398926,
    "reward_max": 2.086127815432984,
    "reward_min": 1.4597352684570701,
    "reward_std": 0.14015900032340115,
    "timesteps": 222999456,
    "learntime": 0.139475807081908,
    "sampletime": 8.637981790816411,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 641,
    "reward_mean": 1.7497127037885536,
    "reward_max": 2.1627001243354163,
    "reward_min": 1.3446902489751755,
    "reward_std": 0.15648656639608663,
    "timesteps": 223360176,
    "learntime": 0.1279141609556973,
    "sampletime": 8.510625669034198,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 642,
    "reward_mean": 1.7775910574777567,
    "reward_max": 2.1234867475242463,
    "reward_min": 1.476479665030525,
    "reward_std": 0.16197940088841203,
    "timesteps": 223720896,
    "learntime": 0.1253880551084876,
    "sampletime": 8.604521420085803,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 643,
    "reward_mean": 1.8374143952753743,
    "reward_max": 2.1578297930326573,
    "reward_min": 1.4801605482123577,
    "reward_std": 0.14313981388568064,
    "timesteps": 224081616,
    "learntime": 0.12451046984642744,
    "sampletime": 8.589389618020505,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 644,
    "reward_mean": 1.8710839895894371,
    "reward_max": 2.2339784179498405,
    "reward_min": 1.5827666717355648,
    "reward_std": 0.13671458664928754,
    "timesteps": 224442336,
    "learntime": 0.12930121994577348,
    "sampletime": 8.460060568992049,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 645,
    "reward_mean": 1.8481693701451687,
    "reward_max": 2.343736558722217,
    "reward_min": 1.5140245283731573,
    "reward_std": 0.1762282450913297,
    "timesteps": 224803056,
    "learntime": 0.12329920590855181,
    "sampletime": 8.546718389028683,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 646,
    "reward_mean": 1.8106609940548761,
    "reward_max": 2.1986589929696865,
    "reward_min": 1.481177719963435,
    "reward_std": 0.142032574398367,
    "timesteps": 225163776,
    "learntime": 0.1334156550001353,
    "sampletime": 8.538988054962829,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 647,
    "reward_mean": 1.8284565135771844,
    "reward_max": 2.1719051654686643,
    "reward_min": 1.538445498464471,
    "reward_std": 0.14758789573967457,
    "timesteps": 225524496,
    "learntime": 0.12541563110426068,
    "sampletime": 8.69481793208979,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 648,
    "reward_mean": 1.845741845369828,
    "reward_max": 2.214617479571393,
    "reward_min": 1.472153558358319,
    "reward_std": 0.15380297907946805,
    "timesteps": 225885216,
    "learntime": 0.12282510381191969,
    "sampletime": 8.547447802964598,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 649,
    "reward_mean": 1.7844757454686622,
    "reward_max": 2.1239968094389146,
    "reward_min": 1.370915829052328,
    "reward_std": 0.14955023023979197,
    "timesteps": 226245936,
    "learntime": 0.12965053017251194,
    "sampletime": 8.517475383123383,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 650,
    "reward_mean": 1.8535116889940346,
    "reward_max": 2.3094555412826585,
    "reward_min": 1.5031254282597102,
    "reward_std": 0.18480566863312675,
    "timesteps": 226606656,
    "learntime": 0.1263048150576651,
    "sampletime": 8.634966909885406,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 651,
    "reward_mean": 1.3307015045322954,
    "reward_max": 2.0197148483452043,
    "reward_min": -7.133676736192272,
    "reward_std": 1.8686059626465725,
    "timesteps": 226966278,
    "learntime": 0.12830326217226684,
    "sampletime": 8.558850570116192,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 652,
    "reward_mean": 1.8251597313531107,
    "reward_max": 2.2125958536723322,
    "reward_min": 1.4231759248469809,
    "reward_std": 0.15395452649630603,
    "timesteps": 227326998,
    "learntime": 0.1316431409213692,
    "sampletime": 8.518918173853308,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 653,
    "reward_mean": 1.7902900122260474,
    "reward_max": 2.2565505993693566,
    "reward_min": 1.2447105884255651,
    "reward_std": 0.18325294544218035,
    "timesteps": 227687718,
    "learntime": 0.12833259999752045,
    "sampletime": 8.608603220200166,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 654,
    "reward_mean": 1.759978570528895,
    "reward_max": 2.215016295779078,
    "reward_min": 1.37122572603226,
    "reward_std": 0.16304242406041117,
    "timesteps": 228048438,
    "learntime": 0.12982406304217875,
    "sampletime": 8.62727249902673,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 655,
    "reward_mean": 1.762400937573999,
    "reward_max": 2.2195402629228957,
    "reward_min": 1.330326518105169,
    "reward_std": 0.1830007211470157,
    "timesteps": 228409158,
    "learntime": 0.13120914506725967,
    "sampletime": 8.611209268914536,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 656,
    "reward_mean": 1.7704402996623432,
    "reward_max": 2.1088539574852656,
    "reward_min": 1.3584554218986948,
    "reward_std": 0.1473846274051081,
    "timesteps": 228769878,
    "learntime": 0.1240951509680599,
    "sampletime": 8.4600111390464,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 657,
    "reward_mean": 1.8468656645743518,
    "reward_max": 2.1001482036768997,
    "reward_min": 1.4841575393780415,
    "reward_std": 0.14491552360741766,
    "timesteps": 229130598,
    "learntime": 0.12150440597906709,
    "sampletime": 8.490033959038556,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 658,
    "reward_mean": 1.8294070441566723,
    "reward_max": 2.1934342327824004,
    "reward_min": 1.589785665545299,
    "reward_std": 0.13409738332780952,
    "timesteps": 229491318,
    "learntime": 0.12628014688380063,
    "sampletime": 8.562629256863147,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 659,
    "reward_mean": 1.3646857440715563,
    "reward_max": 2.128812896144207,
    "reward_min": -7.315671457856135,
    "reward_std": 1.9082890581479786,
    "timesteps": 229850919,
    "learntime": 0.1364049781113863,
    "sampletime": 8.58649168908596,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 660,
    "reward_mean": 0.9388403866169637,
    "reward_max": 2.1243634897568175,
    "reward_min": -7.397133919413937,
    "reward_std": 2.5618664896534544,
    "timesteps": 230209401,
    "learntime": 0.13131943112239242,
    "sampletime": 8.569002574076876,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 661,
    "reward_mean": 1.346564921095803,
    "reward_max": 2.2945304360553993,
    "reward_min": -6.927357249843863,
    "reward_std": 1.7468643787737248,
    "timesteps": 230569002,
    "learntime": 0.12199788517318666,
    "sampletime": 8.542169090127572,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 662,
    "reward_mean": 1.772558366610908,
    "reward_max": 2.1920353653875972,
    "reward_min": 1.4340660375180743,
    "reward_std": 0.16512025214443815,
    "timesteps": 230929722,
    "learntime": 0.1285983370617032,
    "sampletime": 8.552598607027903,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 663,
    "reward_mean": 1.8510609511594986,
    "reward_max": 2.36518509515074,
    "reward_min": 1.4826233641978197,
    "reward_std": 0.16390649285196468,
    "timesteps": 231290442,
    "learntime": 0.1250912679824978,
    "sampletime": 8.52022926718928,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 664,
    "reward_mean": 1.8388450624862256,
    "reward_max": 2.236919591325035,
    "reward_min": 1.4857279454302998,
    "reward_std": 0.1549961923593186,
    "timesteps": 231651162,
    "learntime": 0.1355351998936385,
    "sampletime": 8.641229592030868,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 665,
    "reward_mean": 1.8287808370639915,
    "reward_max": 2.1348204830552038,
    "reward_min": 1.4899629860693948,
    "reward_std": 0.13744008257264936,
    "timesteps": 232011882,
    "learntime": 0.12334584002383053,
    "sampletime": 8.52782580605708,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 666,
    "reward_mean": 1.7957037724857388,
    "reward_max": 2.1245400083328887,
    "reward_min": 1.5279687526263919,
    "reward_std": 0.127561379801121,
    "timesteps": 232372602,
    "learntime": 0.13012481899932027,
    "sampletime": 8.534952549031004,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 667,
    "reward_mean": 1.8231036792887183,
    "reward_max": 2.0792309326281977,
    "reward_min": 1.5879463903485962,
    "reward_std": 0.12233075336336524,
    "timesteps": 232733322,
    "learntime": 0.13953736005350947,
    "sampletime": 8.602523705922067,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 668,
    "reward_mean": 1.826733944709401,
    "reward_max": 2.1139366586540915,
    "reward_min": 1.5213867041165914,
    "reward_std": 0.13954708906101962,
    "timesteps": 233094042,
    "learntime": 0.1370942930225283,
    "sampletime": 8.63772975304164,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 669,
    "reward_mean": 1.7916136695414888,
    "reward_max": 2.2297251352733407,
    "reward_min": 1.2725970654185694,
    "reward_std": 0.17899136465742185,
    "timesteps": 233454762,
    "learntime": 0.13202955410815775,
    "sampletime": 8.577881387900561,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 670,
    "reward_mean": 1.7877707143419177,
    "reward_max": 2.0921275319369355,
    "reward_min": 1.4918924275570467,
    "reward_std": 0.1328175180252871,
    "timesteps": 233815482,
    "learntime": 0.13570280000567436,
    "sampletime": 8.493269226979464,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 671,
    "reward_mean": 1.8353740581970137,
    "reward_max": 2.186766343861093,
    "reward_min": 1.3730226477509269,
    "reward_std": 0.17396581872288244,
    "timesteps": 234176202,
    "learntime": 0.13365914300084114,
    "sampletime": 8.56164318905212,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 672,
    "reward_mean": 1.829586553189296,
    "reward_max": 2.1910168630161517,
    "reward_min": 1.472762663936006,
    "reward_std": 0.14792460364392254,
    "timesteps": 234536922,
    "learntime": 0.13433445105329156,
    "sampletime": 8.621256449026987,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 673,
    "reward_mean": 1.8317097033559868,
    "reward_max": 2.10982226234222,
    "reward_min": 1.5606168721137523,
    "reward_std": 0.1237092589366308,
    "timesteps": 234897642,
    "learntime": 0.13869387796148658,
    "sampletime": 8.594219756079838,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 674,
    "reward_mean": 1.8909190125852051,
    "reward_max": 2.2172631865003907,
    "reward_min": 1.586458542364802,
    "reward_std": 0.15270243767810554,
    "timesteps": 235258362,
    "learntime": 0.12514284090138972,
    "sampletime": 8.501183623215184,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 675,
    "reward_mean": 1.9272244174404916,
    "reward_max": 2.30642200266734,
    "reward_min": 1.5587211228751867,
    "reward_std": 0.14600903754507316,
    "timesteps": 235619082,
    "learntime": 0.12841911311261356,
    "sampletime": 8.571379299042746,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 676,
    "reward_mean": 1.83758883186375,
    "reward_max": 2.1853197970665614,
    "reward_min": 1.3487572315275556,
    "reward_std": 0.14845457334434353,
    "timesteps": 235979802,
    "learntime": 0.13205027813091874,
    "sampletime": 8.509974922984838,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 677,
    "reward_mean": 1.7222010318667602,
    "reward_max": 2.074601461557462,
    "reward_min": 1.3065578730024223,
    "reward_std": 0.16220045359297575,
    "timesteps": 236340522,
    "learntime": 0.13192475005052984,
    "sampletime": 8.50023036194034,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 678,
    "reward_mean": 1.7616657129814652,
    "reward_max": 2.307063769884265,
    "reward_min": 1.3488773848106497,
    "reward_std": 0.1854397945316524,
    "timesteps": 236701242,
    "learntime": 0.1296259460505098,
    "sampletime": 8.444015915039927,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 679,
    "reward_mean": 1.733421366052346,
    "reward_max": 2.0775807799143458,
    "reward_min": 1.3826648526517202,
    "reward_std": 0.15935524770824533,
    "timesteps": 237061962,
    "learntime": 0.12515684799291193,
    "sampletime": 8.403073061956093,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 680,
    "reward_mean": 1.8652311227733418,
    "reward_max": 2.2709702705879757,
    "reward_min": 1.423024704155534,
    "reward_std": 0.17239702717649275,
    "timesteps": 237422682,
    "learntime": 0.1243825510609895,
    "sampletime": 8.612484056968242,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 681,
    "reward_mean": 1.851590598977795,
    "reward_max": 2.217272043000607,
    "reward_min": 1.4800833733849361,
    "reward_std": 0.14764060131789747,
    "timesteps": 237783402,
    "learntime": 0.1194696300663054,
    "sampletime": 8.50611469708383,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 682,
    "reward_mean": 1.387283794845739,
    "reward_max": 2.1318340557402475,
    "reward_min": -7.203090656670008,
    "reward_std": 1.891456453015329,
    "timesteps": 238143087,
    "learntime": 0.1280410869512707,
    "sampletime": 8.58928483701311,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 683,
    "reward_mean": 0.849559786018425,
    "reward_max": 1.9896198733826351,
    "reward_min": -17.350101143578566,
    "reward_std": 3.214134605980074,
    "timesteps": 238501737,
    "learntime": 0.13277401705272496,
    "sampletime": 8.509069695835933,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 684,
    "reward_mean": 1.7252223625029646,
    "reward_max": 2.039779002915814,
    "reward_min": 1.245244729073923,
    "reward_std": 0.17767351907829979,
    "timesteps": 238862457,
    "learntime": 0.1332316359039396,
    "sampletime": 8.533083513844758,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 685,
    "reward_mean": 1.8158152956646718,
    "reward_max": 2.3363165392356935,
    "reward_min": 1.4563070623641523,
    "reward_std": 0.20020295374825292,
    "timesteps": 239223177,
    "learntime": 0.13661386398598552,
    "sampletime": 8.61308669205755,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 686,
    "reward_mean": 1.787263309301164,
    "reward_max": 2.2704711382058567,
    "reward_min": 1.4010475412660237,
    "reward_std": 0.15131952916717128,
    "timesteps": 239583897,
    "learntime": 0.12489792192354798,
    "sampletime": 8.571352462051436,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 687,
    "reward_mean": 1.8089958384524039,
    "reward_max": 2.1264137879215075,
    "reward_min": 1.4690802392821432,
    "reward_std": 0.15286082050863412,
    "timesteps": 239944617,
    "learntime": 0.12464059586636722,
    "sampletime": 8.541857633041218,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 688,
    "reward_mean": 1.8273978653923808,
    "reward_max": 2.270299703226752,
    "reward_min": 1.4770792789883336,
    "reward_std": 0.18131336738503667,
    "timesteps": 240305337,
    "learntime": 0.13732610689476132,
    "sampletime": 8.60601791087538,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 689,
    "reward_mean": 1.7733653809887877,
    "reward_max": 2.219091567182629,
    "reward_min": 1.0515744249384023,
    "reward_std": 0.2088693170640365,
    "timesteps": 240666057,
    "learntime": 0.12855357117950916,
    "sampletime": 8.517332328017801,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 690,
    "reward_mean": 1.8070349838908695,
    "reward_max": 2.1535406114734603,
    "reward_min": 1.4658920178225123,
    "reward_std": 0.15595220128378448,
    "timesteps": 241026777,
    "learntime": 0.1413707109168172,
    "sampletime": 8.557053311960772,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 691,
    "reward_mean": 1.2953323795547902,
    "reward_max": 2.0765790625080207,
    "reward_min": -7.372890829253294,
    "reward_std": 1.893922175244105,
    "timesteps": 241386291,
    "learntime": 0.12519691605120897,
    "sampletime": 8.507294724928215,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 692,
    "reward_mean": 1.7458994242329835,
    "reward_max": 2.123794507094619,
    "reward_min": 1.3572863563643585,
    "reward_std": 0.1497332736003635,
    "timesteps": 241747011,
    "learntime": 0.13286909111775458,
    "sampletime": 8.585334756877273,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 693,
    "reward_mean": 1.8494403768989298,
    "reward_max": 2.219848836466551,
    "reward_min": 1.461120582032227,
    "reward_std": 0.1544109232646162,
    "timesteps": 242107731,
    "learntime": 0.12568414909765124,
    "sampletime": 8.721306302119046,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 694,
    "reward_mean": 1.8758956409230627,
    "reward_max": 2.178296658191051,
    "reward_min": 1.4400628727223965,
    "reward_std": 0.15426429994139387,
    "timesteps": 242468451,
    "learntime": 0.12910770601592958,
    "sampletime": 8.562836509896442,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 695,
    "reward_mean": 1.8087125418947512,
    "reward_max": 2.1927885716766875,
    "reward_min": 1.4541865798307803,
    "reward_std": 0.14197460704975692,
    "timesteps": 242829171,
    "learntime": 0.1311769241001457,
    "sampletime": 8.611047091893852,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 696,
    "reward_mean": 1.7777398482957143,
    "reward_max": 2.101101664398534,
    "reward_min": 1.502243950560856,
    "reward_std": 0.12309592303025571,
    "timesteps": 243189891,
    "learntime": 0.1248794209677726,
    "sampletime": 8.553004748886451,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 697,
    "reward_mean": 0.9666236413420219,
    "reward_max": 2.273940701891354,
    "reward_min": -16.20327052771013,
    "reward_std": 3.039562457472764,
    "timesteps": 243548217,
    "learntime": 0.13486976502463222,
    "sampletime": 8.45216778991744,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 698,
    "reward_mean": 1.858519101867301,
    "reward_max": 2.1978487161298563,
    "reward_min": 1.5279074122167466,
    "reward_std": 0.15846031114856052,
    "timesteps": 243908937,
    "learntime": 0.1298491950146854,
    "sampletime": 8.593487706035376,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 699,
    "reward_mean": 1.7863416524418307,
    "reward_max": 2.1581717584631392,
    "reward_min": 1.3858157820520998,
    "reward_std": 0.13854233636184696,
    "timesteps": 244269657,
    "learntime": 0.12364285090006888,
    "sampletime": 8.646561315981671,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 700,
    "reward_mean": 1.399023358528243,
    "reward_max": 2.1893602477741094,
    "reward_min": -7.031748287855987,
    "reward_std": 1.8540365117582156,
    "timesteps": 244629393,
    "learntime": 0.12551729590632021,
    "sampletime": 8.525630499934778,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 701,
    "reward_mean": 1.771515385238239,
    "reward_max": 2.0206674746675115,
    "reward_min": 1.4192504823158443,
    "reward_std": 0.12360484956911753,
    "timesteps": 244990113,
    "learntime": 0.13205701997503638,
    "sampletime": 8.641157766105607,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 702,
    "reward_mean": 1.7040489925762528,
    "reward_max": 2.0197517045801785,
    "reward_min": 1.3637365295311812,
    "reward_std": 0.13983055779668607,
    "timesteps": 245350833,
    "learntime": 0.12498439103364944,
    "sampletime": 8.62558500887826,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 703,
    "reward_mean": 0.535158548914239,
    "reward_max": 2.151168301898803,
    "reward_min": -7.313885987937367,
    "reward_std": 3.078599876558556,
    "timesteps": 245708979,
    "learntime": 0.1328217377886176,
    "sampletime": 8.4857922650408,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 704,
    "reward_mean": 1.7955023585137717,
    "reward_max": 2.0795641141153394,
    "reward_min": 1.4551351120203908,
    "reward_std": 0.14340375785014614,
    "timesteps": 246069699,
    "learntime": 0.13065986102446914,
    "sampletime": 8.517100716009736,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 705,
    "reward_mean": 1.4025193146439818,
    "reward_max": 2.2737634000897544,
    "reward_min": -7.083007307659667,
    "reward_std": 1.822264900899247,
    "timesteps": 246429507,
    "learntime": 0.1290396419353783,
    "sampletime": 8.564403153024614,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 706,
    "reward_mean": 1.0393602489686855,
    "reward_max": 2.1773879824241784,
    "reward_min": -7.079189962319412,
    "reward_std": 2.530197895044705,
    "timesteps": 246788403,
    "learntime": 0.1420221021398902,
    "sampletime": 8.57300835615024,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 707,
    "reward_mean": 1.4014180475921374,
    "reward_max": 2.2609977217260586,
    "reward_min": -6.964641280532255,
    "reward_std": 1.8563502128908296,
    "timesteps": 247148211,
    "learntime": 0.12477632402442396,
    "sampletime": 8.521076703909785,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 708,
    "reward_mean": 1.7830447097969717,
    "reward_max": 2.168434517621238,
    "reward_min": 1.4137348823246068,
    "reward_std": 0.16939157273225652,
    "timesteps": 247508931,
    "learntime": 0.12951587396673858,
    "sampletime": 8.533222319092602,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 709,
    "reward_mean": 1.7819531456796018,
    "reward_max": 2.0894084697744484,
    "reward_min": 1.46781491592992,
    "reward_std": 0.1414362741478087,
    "timesteps": 247869651,
    "learntime": 0.13360583293251693,
    "sampletime": 8.621682123048231,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 710,
    "reward_mean": 1.8201146912356614,
    "reward_max": 2.1293148701196025,
    "reward_min": 1.3301034273692578,
    "reward_std": 0.14721773325573956,
    "timesteps": 248230371,
    "learntime": 0.14136806805618107,
    "sampletime": 8.549606109969318,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 711,
    "reward_mean": 1.79430936153893,
    "reward_max": 2.1513222700097776,
    "reward_min": 1.4350789765966383,
    "reward_std": 0.15183444591344994,
    "timesteps": 248591091,
    "learntime": 0.13627826608717442,
    "sampletime": 8.654220257187262,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 712,
    "reward_mean": 1.7832569543348016,
    "reward_max": 2.0819561033259184,
    "reward_min": 1.41325450548902,
    "reward_std": 0.1400416342329905,
    "timesteps": 248951811,
    "learntime": 0.14052657410502434,
    "sampletime": 8.496199031826109,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 713,
    "reward_mean": 1.8374434417578356,
    "reward_max": 2.2872313705341734,
    "reward_min": 1.460523837094011,
    "reward_std": 0.17053938787032982,
    "timesteps": 249312531,
    "learntime": 0.13111493596807122,
    "sampletime": 8.549854298122227,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 714,
    "reward_mean": 1.884165025548116,
    "reward_max": 2.1528286382478314,
    "reward_min": 1.553016115715513,
    "reward_std": 0.15032503994015292,
    "timesteps": 249673251,
    "learntime": 0.13183191395364702,
    "sampletime": 8.569714314071462,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 715,
    "reward_mean": 1.822402454527064,
    "reward_max": 2.0870982303185297,
    "reward_min": 1.3881453490255125,
    "reward_std": 0.156828307028513,
    "timesteps": 250033971,
    "learntime": 0.1367477048188448,
    "sampletime": 8.59400199400261,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 716,
    "reward_mean": 1.8075355574225624,
    "reward_max": 2.232841151688867,
    "reward_min": 1.4381964886807956,
    "reward_std": 0.17809562207299176,
    "timesteps": 250394691,
    "learntime": 0.12691916315816343,
    "sampletime": 8.569149130955338,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 717,
    "reward_mean": 1.746784219197785,
    "reward_max": 2.0986085770568788,
    "reward_min": 1.3091973119069598,
    "reward_std": 0.16488969570568277,
    "timesteps": 250755411,
    "learntime": 0.12643633503466845,
    "sampletime": 8.578021929133683,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 718,
    "reward_mean": 1.500027724103201,
    "reward_max": 2.224722748363595,
    "reward_min": -15.997790768913658,
    "reward_std": 2.4775888306443545,
    "timesteps": 251114985,
    "learntime": 0.1285493979230523,
    "sampletime": 8.440415994031355,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 719,
    "reward_mean": 1.850480251814766,
    "reward_max": 2.3526058170739805,
    "reward_min": 1.5118426583040565,
    "reward_std": 0.16900572847013404,
    "timesteps": 251475705,
    "learntime": 0.12614670884795487,
    "sampletime": 8.690274670021608,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 720,
    "reward_mean": 1.800928165511559,
    "reward_max": 2.2996613493676024,
    "reward_min": 1.3658648602361065,
    "reward_std": 0.14910459523671346,
    "timesteps": 251836425,
    "learntime": 0.12938933493569493,
    "sampletime": 8.51116605498828,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 721,
    "reward_mean": 1.791851822008315,
    "reward_max": 2.1460368805564887,
    "reward_min": 1.3325748243627846,
    "reward_std": 0.15766992877411676,
    "timesteps": 252197145,
    "learntime": 0.13232582504861057,
    "sampletime": 8.599193521076813,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 722,
    "reward_mean": 1.4772003553547535,
    "reward_max": 2.1768822296536627,
    "reward_min": -6.970600068315187,
    "reward_std": 1.7656072870185362,
    "timesteps": 252556908,
    "learntime": 0.12301005888730288,
    "sampletime": 8.477007102919742,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 723,
    "reward_mean": 1.7858953534916504,
    "reward_max": 2.0281881861543853,
    "reward_min": 1.4911409644656928,
    "reward_std": 0.13068105006664044,
    "timesteps": 252917628,
    "learntime": 0.13195501593872905,
    "sampletime": 8.634792278055102,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 724,
    "reward_mean": 1.7675197647452696,
    "reward_max": 2.1103638777911455,
    "reward_min": 1.4636280247537359,
    "reward_std": 0.12524878061376735,
    "timesteps": 253278348,
    "learntime": 0.12546901893801987,
    "sampletime": 8.631404560059309,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 725,
    "reward_mean": 1.7494325924010445,
    "reward_max": 2.0985588423456187,
    "reward_min": 1.3878939206479097,
    "reward_std": 0.13619463025584969,
    "timesteps": 253639068,
    "learntime": 0.13319106819108129,
    "sampletime": 8.505001097917557,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 726,
    "reward_mean": 1.7975196676941891,
    "reward_max": 2.277821014894772,
    "reward_min": 1.5074238013158625,
    "reward_std": 0.191501408783266,
    "timesteps": 253999788,
    "learntime": 0.14888986409641802,
    "sampletime": 8.516616001958027,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 727,
    "reward_mean": 1.7931129489436344,
    "reward_max": 2.0935116345115765,
    "reward_min": 1.4047278925268463,
    "reward_std": 0.172016202130454,
    "timesteps": 254360508,
    "learntime": 0.12297956785187125,
    "sampletime": 8.468671848066151,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 728,
    "reward_mean": 1.7451595736172572,
    "reward_max": 2.0485583571805317,
    "reward_min": 1.4192711348419584,
    "reward_std": 0.14633841784202278,
    "timesteps": 254721228,
    "learntime": 0.1270778519101441,
    "sampletime": 8.60303597804159,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 729,
    "reward_mean": 1.7943673649348992,
    "reward_max": 2.1244307021014586,
    "reward_min": 1.3472543346535064,
    "reward_std": 0.16340185616329958,
    "timesteps": 255081948,
    "learntime": 0.13213458703830838,
    "sampletime": 8.50554440007545,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 730,
    "reward_mean": 1.7812684237980148,
    "reward_max": 2.0260777156570713,
    "reward_min": 1.4989325057337695,
    "reward_std": 0.1320118694664345,
    "timesteps": 255442668,
    "learntime": 0.12949881213717163,
    "sampletime": 8.573864858830348,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 731,
    "reward_mean": 1.752328532131683,
    "reward_max": 2.0881091998501975,
    "reward_min": 1.3807917707740789,
    "reward_std": 0.12450483859090915,
    "timesteps": 255803388,
    "learntime": 0.128073011059314,
    "sampletime": 8.441231986042112,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 732,
    "reward_mean": 1.7731047772129778,
    "reward_max": 2.174775776899903,
    "reward_min": 1.421283421698411,
    "reward_std": 0.16621673142032228,
    "timesteps": 256164108,
    "learntime": 0.13008528295904398,
    "sampletime": 8.501028080005199,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 733,
    "reward_mean": 1.8245912324185325,
    "reward_max": 2.2103007802048293,
    "reward_min": 1.4933309736097138,
    "reward_std": 0.13794023828336704,
    "timesteps": 256524828,
    "learntime": 0.13219784502871335,
    "sampletime": 8.632314021000639,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 734,
    "reward_mean": 1.8101470186660267,
    "reward_max": 2.1653490400860744,
    "reward_min": 1.415436883806248,
    "reward_std": 0.14687150862538745,
    "timesteps": 256885548,
    "learntime": 0.13305982295423746,
    "sampletime": 8.527835385873914,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 735,
    "reward_mean": 1.4147439531134536,
    "reward_max": 2.257178343767815,
    "reward_min": -7.069527821774089,
    "reward_std": 1.830403419714242,
    "timesteps": 257245143,
    "learntime": 0.1322083231061697,
    "sampletime": 8.559462870005518,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 736,
    "reward_mean": 1.8686812396226675,
    "reward_max": 2.1223333254350654,
    "reward_min": 1.5282478143604772,
    "reward_std": 0.13594772422611168,
    "timesteps": 257605863,
    "learntime": 0.13236585911363363,
    "sampletime": 8.609091257909313,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 737,
    "reward_mean": 1.7813568299830882,
    "reward_max": 2.081491816825952,
    "reward_min": 1.4472881725382498,
    "reward_std": 0.14374393829432525,
    "timesteps": 257966583,
    "learntime": 0.1377303118351847,
    "sampletime": 8.6283335799817,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 738,
    "reward_mean": 1.8055610930403145,
    "reward_max": 2.1492708726842498,
    "reward_min": 1.4623308727362494,
    "reward_std": 0.13856953497334681,
    "timesteps": 258327303,
    "learntime": 0.13006469001993537,
    "sampletime": 8.465994619065896,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 739,
    "reward_mean": 0.09481195226828334,
    "reward_max": 2.0060558500064682,
    "reward_min": -16.47184263632605,
    "reward_std": 4.141508051236038,
    "timesteps": 258684102,
    "learntime": 0.13377602701075375,
    "sampletime": 8.432577179046348,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 740,
    "reward_mean": 1.8523830723163506,
    "reward_max": 2.1612355186124166,
    "reward_min": 1.5844317711889717,
    "reward_std": 0.1551508332906066,
    "timesteps": 259044822,
    "learntime": 0.13004192616790533,
    "sampletime": 8.447986226063222,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 741,
    "reward_mean": 1.4042260362328416,
    "reward_max": 2.2122406873774394,
    "reward_min": -7.577045130494025,
    "reward_std": 1.9185606168506624,
    "timesteps": 259404588,
    "learntime": 0.13615000201389194,
    "sampletime": 8.480036980938166,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 742,
    "reward_mean": 1.8402643407704602,
    "reward_max": 2.2349909984817087,
    "reward_min": 1.475789473630189,
    "reward_std": 0.15127743262974944,
    "timesteps": 259765308,
    "learntime": 0.13634388288483024,
    "sampletime": 8.58031477802433,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 743,
    "reward_mean": 1.8109386023167158,
    "reward_max": 2.139774887516977,
    "reward_min": 1.457654237179227,
    "reward_std": 0.1501083994440284,
    "timesteps": 260126028,
    "learntime": 0.14113109186291695,
    "sampletime": 8.4762290220242,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 744,
    "reward_mean": 1.8508589412898835,
    "reward_max": 2.2379856255605692,
    "reward_min": 1.5435503957172207,
    "reward_std": 0.16252672185315978,
    "timesteps": 260486748,
    "learntime": 0.13618072401732206,
    "sampletime": 8.544735588133335,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 745,
    "reward_mean": 1.8152396387635192,
    "reward_max": 2.2455340947490168,
    "reward_min": 1.5092922822663999,
    "reward_std": 0.16713575236766637,
    "timesteps": 260847468,
    "learntime": 0.12982858181931078,
    "sampletime": 8.457208714913577,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 746,
    "reward_mean": 1.7906263265708116,
    "reward_max": 2.162339676100984,
    "reward_min": 1.5126171433067694,
    "reward_std": 0.14095130310472806,
    "timesteps": 261208188,
    "learntime": 0.13615288096480072,
    "sampletime": 8.617051794892177,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 747,
    "reward_mean": 1.7801434463704215,
    "reward_max": 2.0748810815509353,
    "reward_min": 1.4701866065839886,
    "reward_std": 0.13401041479426562,
    "timesteps": 261568908,
    "learntime": 0.12989981402643025,
    "sampletime": 8.565612139878795,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 748,
    "reward_mean": 1.8075529866343314,
    "reward_max": 2.0991623931666683,
    "reward_min": 1.4435287684170877,
    "reward_std": 0.154376890119446,
    "timesteps": 261929628,
    "learntime": 0.13292571203783154,
    "sampletime": 8.539124886970967,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 749,
    "reward_mean": 1.7843192604366487,
    "reward_max": 2.147984684332075,
    "reward_min": 1.4149560878885832,
    "reward_std": 0.17472928415140287,
    "timesteps": 262290348,
    "learntime": 0.11981927207671106,
    "sampletime": 8.558876391034573,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 750,
    "reward_mean": 1.4871691634158795,
    "reward_max": 2.3301212815550207,
    "reward_min": -6.755905707382641,
    "reward_std": 1.785308849697127,
    "timesteps": 262649889,
    "learntime": 0.13188460399396718,
    "sampletime": 8.47461461299099,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 751,
    "reward_mean": 1.8654202134261992,
    "reward_max": 2.3666223244799736,
    "reward_min": 1.5353402441998873,
    "reward_std": 0.1783998085144636,
    "timesteps": 263010609,
    "learntime": 0.1287816611584276,
    "sampletime": 8.64691643603146,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 752,
    "reward_mean": 1.8494623071234264,
    "reward_max": 2.2887216643906507,
    "reward_min": 1.4722624512558609,
    "reward_std": 0.18061515497879804,
    "timesteps": 263371329,
    "learntime": 0.13331222697161138,
    "sampletime": 8.555979368044063,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 753,
    "reward_mean": 1.8013902787797451,
    "reward_max": 2.141950480814557,
    "reward_min": 1.5013880106041924,
    "reward_std": 0.14050959791012232,
    "timesteps": 263732049,
    "learntime": 0.1294349180534482,
    "sampletime": 8.535335131920874,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 754,
    "reward_mean": 1.8550426416328851,
    "reward_max": 2.198725816269868,
    "reward_min": 1.3903831087708076,
    "reward_std": 0.16752734310343642,
    "timesteps": 264092769,
    "learntime": 0.12376439687795937,
    "sampletime": 8.513743788935244,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 755,
    "reward_mean": 1.8155042925690785,
    "reward_max": 2.2395507922162836,
    "reward_min": 1.4204739850564758,
    "reward_std": 0.19003283554652856,
    "timesteps": 264453489,
    "learntime": 0.13626358401961625,
    "sampletime": 8.611169974086806,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 756,
    "reward_mean": 1.869515554038307,
    "reward_max": 2.4488597961502445,
    "reward_min": 1.1353096956754032,
    "reward_std": 0.19319267342464422,
    "timesteps": 264814209,
    "learntime": 0.128891363972798,
    "sampletime": 8.54957815213129,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 757,
    "reward_mean": 1.8478006299409713,
    "reward_max": 2.2283464984917134,
    "reward_min": 1.3696860952980119,
    "reward_std": 0.1807814323494912,
    "timesteps": 265174929,
    "learntime": 0.1406783820129931,
    "sampletime": 8.569960137130693,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 758,
    "reward_mean": 1.910279878244748,
    "reward_max": 2.4670077915620294,
    "reward_min": 1.388310074407577,
    "reward_std": 0.20285271449242098,
    "timesteps": 265535649,
    "learntime": 0.13338493998162448,
    "sampletime": 8.549334638984874,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 759,
    "reward_mean": 1.8449593106046318,
    "reward_max": 2.1262322684862833,
    "reward_min": 1.5244437101236188,
    "reward_std": 0.134221174003158,
    "timesteps": 265896369,
    "learntime": 0.1342990598641336,
    "sampletime": 8.444880196126178,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 760,
    "reward_mean": 1.808692952986564,
    "reward_max": 2.2996488464713982,
    "reward_min": 1.5040399770527542,
    "reward_std": 0.1457494823434223,
    "timesteps": 266257089,
    "learntime": 0.12460205797106028,
    "sampletime": 8.585199513006955,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 761,
    "reward_mean": 1.8677890191935687,
    "reward_max": 2.2756342115303987,
    "reward_min": 1.5029332491456309,
    "reward_std": 0.14977980881032452,
    "timesteps": 266617809,
    "learntime": 0.12641265196725726,
    "sampletime": 8.513667162973434,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 762,
    "reward_mean": 1.8408963505588756,
    "reward_max": 2.3517678198863208,
    "reward_min": 1.427206427713494,
    "reward_std": 0.16143344550511735,
    "timesteps": 266978529,
    "learntime": 0.132775051984936,
    "sampletime": 8.577189214993268,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 763,
    "reward_mean": 1.8458462626520165,
    "reward_max": 2.416668568763158,
    "reward_min": 1.5303943965065423,
    "reward_std": 0.16217689729030646,
    "timesteps": 267339249,
    "learntime": 0.13545019109733403,
    "sampletime": 8.529411144787446,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 764,
    "reward_mean": 1.3834302992147438,
    "reward_max": 2.121340423145956,
    "reward_min": -7.043169145317129,
    "reward_std": 1.868116225537776,
    "timesteps": 267698787,
    "learntime": 0.11937806499190629,
    "sampletime": 8.632386213866994,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 765,
    "reward_mean": 1.073088626126967,
    "reward_max": 2.1780705470873993,
    "reward_min": -7.138221757147803,
    "reward_std": 2.5039324078396623,
    "timesteps": 268057143,
    "learntime": 0.1305783821735531,
    "sampletime": 8.465385752962902,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 766,
    "reward_mean": 1.4318125443349192,
    "reward_max": 2.1068089693807317,
    "reward_min": -6.956513111987575,
    "reward_std": 1.7624234476460898,
    "timesteps": 268416681,
    "learntime": 0.1300802049227059,
    "sampletime": 8.64327814313583,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 767,
    "reward_mean": 1.835661624132051,
    "reward_max": 2.1962117651362645,
    "reward_min": 1.5192077040855723,
    "reward_std": 0.13857401528367141,
    "timesteps": 268777401,
    "learntime": 0.13823798089288175,
    "sampletime": 8.520631085848436,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 768,
    "reward_mean": 1.8614759752988554,
    "reward_max": 2.2590709826520934,
    "reward_min": 1.5787947712832975,
    "reward_std": 0.1278029410479298,
    "timesteps": 269138121,
    "learntime": 0.13158368016593158,
    "sampletime": 8.527680383063853,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 769,
    "reward_mean": 1.0724970072661217,
    "reward_max": 2.201427088819344,
    "reward_min": -7.589342966640481,
    "reward_std": 2.538997335123792,
    "timesteps": 269496417,
    "learntime": 0.1359048830345273,
    "sampletime": 8.509187079034746,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 770,
    "reward_mean": 1.3492188095205064,
    "reward_max": 1.9823063791140363,
    "reward_min": -7.378927317490295,
    "reward_std": 1.9264865879092778,
    "timesteps": 269855925,
    "learntime": 0.13074614410288632,
    "sampletime": 8.482256245799363,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 771,
    "reward_mean": 1.709374613462995,
    "reward_max": 2.173808381384744,
    "reward_min": 1.213996318515536,
    "reward_std": 0.1733011903679378,
    "timesteps": 270216645,
    "learntime": 0.13529854314401746,
    "sampletime": 8.617672795196995,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 772,
    "reward_mean": 1.8066692074513124,
    "reward_max": 2.16113178060517,
    "reward_min": 1.4218008022920279,
    "reward_std": 0.19004563683435308,
    "timesteps": 270577365,
    "learntime": 0.13452959596179426,
    "sampletime": 8.434843613998964,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 773,
    "reward_mean": 1.7848282187422293,
    "reward_max": 2.167672181866663,
    "reward_min": 1.4739673479237916,
    "reward_std": 0.14073129109092544,
    "timesteps": 270938085,
    "learntime": 0.13780200900509953,
    "sampletime": 8.567099621053785,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 774,
    "reward_mean": 1.8462147858158102,
    "reward_max": 2.355084039797979,
    "reward_min": 1.5332335821268233,
    "reward_std": 0.15470847759581458,
    "timesteps": 271298805,
    "learntime": 0.12879307195544243,
    "sampletime": 8.59423556085676,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 775,
    "reward_mean": 1.8167008260644824,
    "reward_max": 2.278953681290711,
    "reward_min": 1.3359069081524242,
    "reward_std": 0.18534459317541158,
    "timesteps": 271659525,
    "learntime": 0.13063046406023204,
    "sampletime": 8.565984809072688,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 776,
    "reward_mean": 1.7349004000974575,
    "reward_max": 2.10540276085499,
    "reward_min": 1.3019675685720722,
    "reward_std": 0.16636965701609036,
    "timesteps": 272020245,
    "learntime": 0.13714108406566083,
    "sampletime": 8.552252148045227,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 777,
    "reward_mean": 1.788121848363975,
    "reward_max": 2.1381858119716366,
    "reward_min": 1.434929109885792,
    "reward_std": 0.1411266900275324,
    "timesteps": 272380965,
    "learntime": 0.135758345015347,
    "sampletime": 8.480732753872871,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 778,
    "reward_mean": 1.8868665367273074,
    "reward_max": 2.2575102571369774,
    "reward_min": 1.4044693206705012,
    "reward_std": 0.19389797919631963,
    "timesteps": 272741685,
    "learntime": 0.13648702506907284,
    "sampletime": 8.55917538702488,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 779,
    "reward_mean": 1.833970855764856,
    "reward_max": 2.149315343620288,
    "reward_min": 1.3775520677057382,
    "reward_std": 0.1480539531387859,
    "timesteps": 273102405,
    "learntime": 0.12884982489049435,
    "sampletime": 8.5279760658741,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 780,
    "reward_mean": 1.39548294018315,
    "reward_max": 2.1631847133200264,
    "reward_min": -7.236286300273303,
    "reward_std": 1.9112045990343742,
    "timesteps": 273461931,
    "learntime": 0.12460643891245127,
    "sampletime": 8.557389054913074,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 781,
    "reward_mean": 1.8414753790760106,
    "reward_max": 2.2536279148215783,
    "reward_min": 1.3236128952086053,
    "reward_std": 0.17660861287302146,
    "timesteps": 273822651,
    "learntime": 0.12927515502087772,
    "sampletime": 8.484169277828187,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 782,
    "reward_mean": 1.7606881786009412,
    "reward_max": 2.2657281019862454,
    "reward_min": 1.3544963448040293,
    "reward_std": 0.1605661262230312,
    "timesteps": 274183371,
    "learntime": 0.13407819508574903,
    "sampletime": 8.453527823090553,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 783,
    "reward_mean": 1.771538925440344,
    "reward_max": 2.238269633528857,
    "reward_min": 1.4834018589301372,
    "reward_std": 0.14985780993068365,
    "timesteps": 274544091,
    "learntime": 0.13768599787726998,
    "sampletime": 8.535214317031205,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 784,
    "reward_mean": 1.7824357669664257,
    "reward_max": 2.0670979444952904,
    "reward_min": 1.4298128969782142,
    "reward_std": 0.1400421461137658,
    "timesteps": 274904811,
    "learntime": 0.13244001404382288,
    "sampletime": 8.590595067013055,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 785,
    "reward_mean": 1.7795200278788672,
    "reward_max": 2.109407879877833,
    "reward_min": 1.5282231576517589,
    "reward_std": 0.12248547391910872,
    "timesteps": 275265531,
    "learntime": 0.12041432689875364,
    "sampletime": 8.539403923088685,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 786,
    "reward_mean": 1.3617935407751558,
    "reward_max": 2.074517120621343,
    "reward_min": -7.598069639728322,
    "reward_std": 1.905267427083317,
    "timesteps": 275625051,
    "learntime": 0.14027055399492383,
    "sampletime": 8.463479044148698,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 787,
    "reward_mean": 1.7685706333839675,
    "reward_max": 2.1942657954659235,
    "reward_min": 1.3067543010763585,
    "reward_std": 0.16972099780019653,
    "timesteps": 275985771,
    "learntime": 0.13897166214883327,
    "sampletime": 8.456813071854413,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 788,
    "reward_mean": 1.3232886531496932,
    "reward_max": 2.0639996302391697,
    "reward_min": -7.309635142234836,
    "reward_std": 1.856724504966042,
    "timesteps": 276345474,
    "learntime": 0.12718884111382067,
    "sampletime": 8.58951561897993,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 789,
    "reward_mean": 1.7855867280298277,
    "reward_max": 2.0967254835971554,
    "reward_min": 1.379171581686629,
    "reward_std": 0.1604080869068771,
    "timesteps": 276706194,
    "learntime": 0.1346999821253121,
    "sampletime": 8.63463558186777,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 790,
    "reward_mean": 1.8210613823888013,
    "reward_max": 2.2142463345627394,
    "reward_min": 1.3349846958951765,
    "reward_std": 0.16161123991786253,
    "timesteps": 277066914,
    "learntime": 0.14024224900640547,
    "sampletime": 8.60795077914372,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 791,
    "reward_mean": 1.8015669868220376,
    "reward_max": 2.2473268703624565,
    "reward_min": 1.4577774130334655,
    "reward_std": 0.14899964914197453,
    "timesteps": 277427634,
    "learntime": 0.1352453362196684,
    "sampletime": 8.448429386829957,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 792,
    "reward_mean": 1.8100029231156176,
    "reward_max": 2.192390783088435,
    "reward_min": 1.4396004963412183,
    "reward_std": 0.1706896165207232,
    "timesteps": 277788354,
    "learntime": 0.14184426004067063,
    "sampletime": 8.636400854913518,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 793,
    "reward_mean": 1.831752060969884,
    "reward_max": 2.1505380360917585,
    "reward_min": 1.5662049476064335,
    "reward_std": 0.14145058405568844,
    "timesteps": 278149074,
    "learntime": 0.1346176159568131,
    "sampletime": 8.54593509202823,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 794,
    "reward_mean": 1.899184860320936,
    "reward_max": 2.3664009414161673,
    "reward_min": 1.5512800721035354,
    "reward_std": 0.15370543892032623,
    "timesteps": 278509794,
    "learntime": 0.12401278899051249,
    "sampletime": 8.482392692007124,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 795,
    "reward_mean": 1.863483504912038,
    "reward_max": 2.202073602933632,
    "reward_min": 1.5809492382845305,
    "reward_std": 0.14141623515557641,
    "timesteps": 278870514,
    "learntime": 0.12617702689021826,
    "sampletime": 8.528594861971214,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 796,
    "reward_mean": 1.8529622450054193,
    "reward_max": 2.2867508126558547,
    "reward_min": 0.9751279115549853,
    "reward_std": 0.21871265905401008,
    "timesteps": 279231234,
    "learntime": 0.12760259816423059,
    "sampletime": 8.456889738095924,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 797,
    "reward_mean": 1.859069527049,
    "reward_max": 2.2274321567189537,
    "reward_min": 1.4710981469975308,
    "reward_std": 0.1726345555824753,
    "timesteps": 279591954,
    "learntime": 0.13745676004327834,
    "sampletime": 8.521544746123254,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 798,
    "reward_mean": 1.3458123848939636,
    "reward_max": 2.0472351818138503,
    "reward_min": -7.383747998752039,
    "reward_std": 1.878340505411754,
    "timesteps": 279951741,
    "learntime": 0.13912689196877182,
    "sampletime": 8.566960284020752,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 799,
    "reward_mean": 1.8066893158977502,
    "reward_max": 2.2190863275027346,
    "reward_min": 1.4114467917631035,
    "reward_std": 0.16614152248662373,
    "timesteps": 280312461,
    "learntime": 0.1362055391073227,
    "sampletime": 8.53575204196386,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 800,
    "reward_mean": 1.7839790451087083,
    "reward_max": 2.143098263559458,
    "reward_min": 1.518609364053794,
    "reward_std": 0.13322871063783376,
    "timesteps": 280673181,
    "learntime": 0.13261876488104463,
    "sampletime": 8.569339785957709,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 801,
    "reward_mean": 1.86830462856766,
    "reward_max": 2.173796260674749,
    "reward_min": 1.4048177096475303,
    "reward_std": 0.1242828509918945,
    "timesteps": 281033901,
    "learntime": 0.11628606193698943,
    "sampletime": 8.539297834038734,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 802,
    "reward_mean": 1.8773191736002128,
    "reward_max": 2.2644409105731995,
    "reward_min": 1.6062263884144163,
    "reward_std": 0.16380687525441928,
    "timesteps": 281394621,
    "learntime": 0.13189167785458267,
    "sampletime": 8.460327676031739,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 803,
    "reward_mean": 1.8770654723786113,
    "reward_max": 2.2305943830135857,
    "reward_min": 1.5263787125815818,
    "reward_std": 0.14453457458659308,
    "timesteps": 281755341,
    "learntime": 0.12459876807406545,
    "sampletime": 8.547648993087932,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 804,
    "reward_mean": 1.8832286775065221,
    "reward_max": 2.299175754787733,
    "reward_min": 1.531252862150058,
    "reward_std": 0.1503479067948476,
    "timesteps": 282116061,
    "learntime": 0.13751781289465725,
    "sampletime": 8.663332208059728,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 805,
    "reward_mean": 1.8079685317517047,
    "reward_max": 2.136890511843374,
    "reward_min": 1.3711831552632636,
    "reward_std": 0.1622760998243632,
    "timesteps": 282476781,
    "learntime": 0.1352510720025748,
    "sampletime": 8.532863001106307,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 806,
    "reward_mean": 1.7529275008777252,
    "reward_max": 2.2333166963314066,
    "reward_min": 1.507179553810573,
    "reward_std": 0.1566241933527993,
    "timesteps": 282837501,
    "learntime": 0.13409888511523604,
    "sampletime": 8.618502738885581,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 807,
    "reward_mean": 1.7503795171219176,
    "reward_max": 2.0953996200177305,
    "reward_min": 1.3992485411775577,
    "reward_std": 0.147442999452358,
    "timesteps": 283198221,
    "learntime": 0.18575606308877468,
    "sampletime": 8.564900958910584,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 808,
    "reward_mean": 1.8446872700338586,
    "reward_max": 2.2278125770034287,
    "reward_min": 1.5886670444231228,
    "reward_std": 0.12361033718206213,
    "timesteps": 283558941,
    "learntime": 0.12542629288509488,
    "sampletime": 8.616209679981694,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 809,
    "reward_mean": 1.8304380809093794,
    "reward_max": 2.2810945642448814,
    "reward_min": 1.4706146374891302,
    "reward_std": 0.1611059571085629,
    "timesteps": 283919661,
    "learntime": 0.14391037891618907,
    "sampletime": 8.536582140950486,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 810,
    "reward_mean": 1.9011530312129483,
    "reward_max": 2.1925959084635673,
    "reward_min": 1.5968981599717396,
    "reward_std": 0.13497343678895773,
    "timesteps": 284280381,
    "learntime": 0.1474039249587804,
    "sampletime": 8.534755293047056,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 811,
    "reward_mean": 1.9056707289246195,
    "reward_max": 2.442248337516499,
    "reward_min": 1.3524375838883704,
    "reward_std": 0.18112831776470123,
    "timesteps": 284641101,
    "learntime": 0.13378827087581158,
    "sampletime": 8.549249448115006,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 812,
    "reward_mean": 1.8376975159179534,
    "reward_max": 2.2662419848563826,
    "reward_min": 1.5346235215141784,
    "reward_std": 0.17292215785399181,
    "timesteps": 285001821,
    "learntime": 0.13806941895745695,
    "sampletime": 8.547939402982593,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 813,
    "reward_mean": 1.8770950076782917,
    "reward_max": 2.2107272416914268,
    "reward_min": 1.4723880841029844,
    "reward_std": 0.16016010379005194,
    "timesteps": 285362541,
    "learntime": 0.12969613703899086,
    "sampletime": 8.60404962906614,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 814,
    "reward_mean": 1.358423656031226,
    "reward_max": 2.164449762623528,
    "reward_min": -7.600588938955107,
    "reward_std": 1.976568063673195,
    "timesteps": 285722055,
    "learntime": 0.13213499099947512,
    "sampletime": 8.605754283023998,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 815,
    "reward_mean": 1.7546938724187406,
    "reward_max": 2.1265429166978147,
    "reward_min": 1.4588633523506147,
    "reward_std": 0.15951373630512672,
    "timesteps": 286082775,
    "learntime": 0.12576597998850048,
    "sampletime": 8.516471522860229,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 816,
    "reward_mean": 1.7466338096092127,
    "reward_max": 2.1589309111150197,
    "reward_min": 1.417892628885577,
    "reward_std": 0.14763829113190333,
    "timesteps": 286443495,
    "learntime": 0.13155182590708137,
    "sampletime": 8.623482163064182,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 817,
    "reward_mean": 1.8007436968601156,
    "reward_max": 2.1048856949335315,
    "reward_min": 1.4498169761200446,
    "reward_std": 0.14859962979141905,
    "timesteps": 286804215,
    "learntime": 0.13077596900984645,
    "sampletime": 8.481734048109502,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 818,
    "reward_mean": 1.7844721172045765,
    "reward_max": 2.054738842689952,
    "reward_min": 1.4066225457724832,
    "reward_std": 0.14648237812133028,
    "timesteps": 287164935,
    "learntime": 0.12489431002177298,
    "sampletime": 8.402518758084625,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 819,
    "reward_mean": 1.8162420441046625,
    "reward_max": 2.231387689328667,
    "reward_min": 1.3070981617784112,
    "reward_std": 0.15840344339008963,
    "timesteps": 287525655,
    "learntime": 0.13172569312155247,
    "sampletime": 8.646908677881584,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 820,
    "reward_mean": 1.8341206594435342,
    "reward_max": 2.183090228915466,
    "reward_min": 1.4349286840579487,
    "reward_std": 0.1668667095039615,
    "timesteps": 287886375,
    "learntime": 0.13707163091748953,
    "sampletime": 8.534305232111365,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 821,
    "reward_mean": 1.8258299435465795,
    "reward_max": 2.346159630546797,
    "reward_min": 1.433452426526468,
    "reward_std": 0.17177528559630104,
    "timesteps": 288247095,
    "learntime": 0.1340661719441414,
    "sampletime": 8.497015363071114,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 822,
    "reward_mean": 1.7482032150493656,
    "reward_max": 2.2120529745465523,
    "reward_min": 1.3833899357193844,
    "reward_std": 0.19302644664598814,
    "timesteps": 288607815,
    "learntime": 0.12756524188444018,
    "sampletime": 8.463214924093336,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 823,
    "reward_mean": 1.8597118027410182,
    "reward_max": 2.224100208820092,
    "reward_min": 1.425020890208099,
    "reward_std": 0.1680975732547101,
    "timesteps": 288968535,
    "learntime": 0.1323536210693419,
    "sampletime": 8.574712560977787,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 824,
    "reward_mean": 1.9281205719505867,
    "reward_max": 2.3499879386032565,
    "reward_min": 1.590413496318633,
    "reward_std": 0.15744616168435785,
    "timesteps": 289329255,
    "learntime": 0.13134483504109085,
    "sampletime": 8.50544805591926,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 825,
    "reward_mean": 1.4513185712936973,
    "reward_max": 2.4114130908063887,
    "reward_min": -7.1218359281845185,
    "reward_std": 1.834514398885158,
    "timesteps": 289688793,
    "learntime": 0.14007198112085462,
    "sampletime": 8.437012799084187,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 826,
    "reward_mean": 1.117229984313811,
    "reward_max": 2.415434958550823,
    "reward_min": -6.956839782376352,
    "reward_std": 2.3942427820108736,
    "timesteps": 290047077,
    "learntime": 0.13614585902541876,
    "sampletime": 8.47698331810534,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 827,
    "reward_mean": 1.4763664528995961,
    "reward_max": 2.3143025573162666,
    "reward_min": -7.3647282942463725,
    "reward_std": 1.884493361896236,
    "timesteps": 290406555,
    "learntime": 0.1358870540279895,
    "sampletime": 8.377186198020354,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 828,
    "reward_mean": 1.883690469622723,
    "reward_max": 2.299250167204361,
    "reward_min": 1.497428794854907,
    "reward_std": 0.16392535539256703,
    "timesteps": 290767275,
    "learntime": 0.12741451594047248,
    "sampletime": 8.539968741126359,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 829,
    "reward_mean": 1.9113142620391876,
    "reward_max": 2.230832334287696,
    "reward_min": 1.5362990247932324,
    "reward_std": 0.16165622150055955,
    "timesteps": 291127995,
    "learntime": 0.12748711300082505,
    "sampletime": 8.530222340021282,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 830,
    "reward_mean": 1.5112120245877279,
    "reward_max": 2.463058195040722,
    "reward_min": -7.3386538730670585,
    "reward_std": 1.8325152245709528,
    "timesteps": 291487464,
    "learntime": 0.12525256210938096,
    "sampletime": 8.537794464966282,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 831,
    "reward_mean": 1.8903958485903984,
    "reward_max": 2.2113309119013085,
    "reward_min": 1.5571309398598672,
    "reward_std": 0.15011910695769848,
    "timesteps": 291848184,
    "learntime": 0.1326443669386208,
    "sampletime": 8.55889023304917,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 832,
    "reward_mean": 1.9014652066607085,
    "reward_max": 2.2222725569551005,
    "reward_min": 1.4440642798453491,
    "reward_std": 0.15974459081730047,
    "timesteps": 292208904,
    "learntime": 0.1315119289793074,
    "sampletime": 8.460746271070093,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 833,
    "reward_mean": 2.0539534855557697,
    "reward_max": 2.432215278174471,
    "reward_min": 1.6227256019831662,
    "reward_std": 0.172115671430344,
    "timesteps": 292569624,
    "learntime": 0.13437745487317443,
    "sampletime": 8.60263828211464,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 834,
    "reward_mean": 1.6082466880112618,
    "reward_max": 2.393593534858981,
    "reward_min": -6.65628275559919,
    "reward_std": 1.8200630130111441,
    "timesteps": 292929237,
    "learntime": 0.1289545411709696,
    "sampletime": 8.430751299019903,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 835,
    "reward_mean": 1.9413099440061574,
    "reward_max": 2.4267959444656597,
    "reward_min": 1.5851982392769308,
    "reward_std": 0.1732331622047143,
    "timesteps": 293289957,
    "learntime": 0.1367432631086558,
    "sampletime": 8.446459792088717,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 836,
    "reward_mean": 2.0221874834581413,
    "reward_max": 2.481827982534823,
    "reward_min": 1.5670627226530895,
    "reward_std": 0.1741395902312345,
    "timesteps": 293650677,
    "learntime": 0.1344424260314554,
    "sampletime": 8.540137929841876,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 837,
    "reward_mean": 2.075699763406102,
    "reward_max": 2.467001890290923,
    "reward_min": 1.7139135115307182,
    "reward_std": 0.1656361748997196,
    "timesteps": 294011397,
    "learntime": 0.1250186120159924,
    "sampletime": 8.616385442903265,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 838,
    "reward_mean": 1.6053573118071673,
    "reward_max": 2.3483422074544533,
    "reward_min": -6.783800875725734,
    "reward_std": 1.77979005268026,
    "timesteps": 294371037,
    "learntime": 0.12693865201435983,
    "sampletime": 8.682939133839682,
    "best_max_mean": 1.845385926277884,
    "best_max": 2.503494267680003
  },
  {
    "gen": 839,
    "reward_mean": 2.058871849499326,
    "reward_max": 2.5830753041399537,
    "reward_min": 1.693620354491884,
    "reward_std": 0.1948200089989624,
    "timesteps": 294731757,
    "learntime": 0.1356919959653169,
    "sampletime": 8.590486342087388,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 840,
    "reward_mean": 2.099525188525133,
    "reward_max": 2.473302725155721,
    "reward_min": 1.6885421179220872,
    "reward_std": 0.16975640964029004,
    "timesteps": 295092477,
    "learntime": 0.13787330500781536,
    "sampletime": 8.581320063909516,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 841,
    "reward_mean": 2.161063338618405,
    "reward_max": 2.500245796535055,
    "reward_min": 1.7743825542036715,
    "reward_std": 0.16524081117951717,
    "timesteps": 295453197,
    "learntime": 0.1717294689733535,
    "sampletime": 8.575696183834225,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 842,
    "reward_mean": 1.6421437512420969,
    "reward_max": 2.5130533543779148,
    "reward_min": -6.721549919413081,
    "reward_std": 1.7862085652021784,
    "timesteps": 295812744,
    "learntime": 0.13495287392288446,
    "sampletime": 8.542474105022848,
    "best_max_mean": 2.058871849499326,
    "best_max": 2.5830753041399537
  },
  {
    "gen": 843,
    "reward_mean": 1.7436608506797286,
    "reward_max": 2.7250198722450105,
    "reward_min": -6.843153235477849,
    "reward_std": 1.8513831928031677,
    "timesteps": 296172333,
    "learntime": 0.13699140888638794,
    "sampletime": 8.489444392034784,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 844,
    "reward_mean": 2.0712896209047558,
    "reward_max": 2.505011651776094,
    "reward_min": 1.5738401931170771,
    "reward_std": 0.18714050114726075,
    "timesteps": 296533053,
    "learntime": 0.14650612510740757,
    "sampletime": 8.578100292012095,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 845,
    "reward_mean": 0.4420963542186888,
    "reward_max": 2.656277758004656,
    "reward_min": -14.20844099986587,
    "reward_std": 3.6377840336073506,
    "timesteps": 296889069,
    "learntime": 0.13435140415094793,
    "sampletime": 8.558207120047882,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 846,
    "reward_mean": 1.7250031694963999,
    "reward_max": 2.588000792526693,
    "reward_min": -6.701930321195646,
    "reward_std": 1.8088248095808004,
    "timesteps": 297248526,
    "learntime": 0.13824366102926433,
    "sampletime": 8.662562279962003,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 847,
    "reward_mean": 1.3332077051663191,
    "reward_max": 2.614833053264932,
    "reward_min": -6.8166216361392875,
    "reward_std": 2.536935702897685,
    "timesteps": 297606972,
    "learntime": 0.13450703700073063,
    "sampletime": 8.665727473096922,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 848,
    "reward_mean": 0.8760961752126922,
    "reward_max": 2.638411948773862,
    "reward_min": -15.400294656641291,
    "reward_std": 3.4254093348054715,
    "timesteps": 297964233,
    "learntime": 0.13722399389371276,
    "sampletime": 8.515101971104741,
    "best_max_mean": 1.7436608506797286,
    "best_max": 2.7250198722450105
  },
  {
    "gen": 849,
    "reward_mean": 0.609930362310963,
    "reward_max": 2.8464966895399155,
    "reward_min": -6.911531994951833,
    "reward_std": 3.403068783111828,
    "timesteps": 298320180,
    "learntime": 0.12893028394319117,
    "sampletime": 8.379700835095719,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 850,
    "reward_mean": 1.7907172017515698,
    "reward_max": 2.6280875099358965,
    "reward_min": -6.420993326385295,
    "reward_std": 1.7147493924118378,
    "timesteps": 298679688,
    "learntime": 0.2157178670167923,
    "sampletime": 8.447089467896149,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 851,
    "reward_mean": 0.8293640680080099,
    "reward_max": 2.3939241692287085,
    "reward_min": -15.974180284915775,
    "reward_std": 3.4562036461137273,
    "timesteps": 299037306,
    "learntime": 0.13075844990089536,
    "sampletime": 8.477766466094181,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 852,
    "reward_mean": 0.4743980631017777,
    "reward_max": 2.50615733728751,
    "reward_min": -13.91832605101728,
    "reward_std": 3.591540831997186,
    "timesteps": 299393511,
    "learntime": 0.1414406099356711,
    "sampletime": 8.487627286929637,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 853,
    "reward_mean": 1.3600632062812217,
    "reward_max": 2.5813185490442243,
    "reward_min": -6.75414747181772,
    "reward_std": 2.532982302265576,
    "timesteps": 299752341,
    "learntime": 0.12413360690698028,
    "sampletime": 8.569724316941574,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 854,
    "reward_mean": 0.43416817898796506,
    "reward_max": 2.5354521977962095,
    "reward_min": -14.272499361405304,
    "reward_std": 3.5892058433773824,
    "timesteps": 300108474,
    "learntime": 0.13034261902794242,
    "sampletime": 8.378565389895812,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 855,
    "reward_mean": -0.3452289169972088,
    "reward_max": 2.4463979606657738,
    "reward_min": -14.097769489889393,
    "reward_std": 4.135209625575024,
    "timesteps": 300462477,
    "learntime": 0.13204900710843503,
    "sampletime": 8.552175387972966,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 856,
    "reward_mean": 0.906344291818256,
    "reward_max": 2.4684097405821124,
    "reward_min": -15.539322549143854,
    "reward_std": 3.7295536355150074,
    "timesteps": 300820401,
    "learntime": 0.12058063712902367,
    "sampletime": 8.421226494014263,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 857,
    "reward_mean": 1.4534137039757788,
    "reward_max": 2.6210208107398967,
    "reward_min": -6.620240888762942,
    "reward_std": 2.399736277054886,
    "timesteps": 301178772,
    "learntime": 0.12378833792172372,
    "sampletime": 8.458957394119352,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 858,
    "reward_mean": 0.8701813226363749,
    "reward_max": 2.55625842752973,
    "reward_min": -7.256471992341565,
    "reward_std": 3.094832970603802,
    "timesteps": 301535889,
    "learntime": 0.12776332907378674,
    "sampletime": 8.495962131069973,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 859,
    "reward_mean": 1.6504385828064407,
    "reward_max": 2.5216105806256444,
    "reward_min": -6.926422433079238,
    "reward_std": 1.8626394800651982,
    "timesteps": 301895481,
    "learntime": 0.1370008650701493,
    "sampletime": 8.57178678107448,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 860,
    "reward_mean": 0.882797794799332,
    "reward_max": 2.611978237347845,
    "reward_min": -14.389257736727211,
    "reward_std": 3.348678279016589,
    "timesteps": 302253240,
    "learntime": 0.139254858950153,
    "sampletime": 8.510022229980677,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 861,
    "reward_mean": 0.8695284155144858,
    "reward_max": 2.480150960541017,
    "reward_min": -15.32332404150282,
    "reward_std": 3.352888402710527,
    "timesteps": 302610660,
    "learntime": 0.12486324901692569,
    "sampletime": 8.414350682171062,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 862,
    "reward_mean": 0.9040167831515579,
    "reward_max": 2.4605848956540046,
    "reward_min": -6.758122408522691,
    "reward_std": 2.8953156830219213,
    "timesteps": 302967987,
    "learntime": 0.13304066797718406,
    "sampletime": 8.479342970065773,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 863,
    "reward_mean": 0.5300261619278434,
    "reward_max": 2.672355155671317,
    "reward_min": -15.539296968099238,
    "reward_std": 3.705655375361127,
    "timesteps": 303324078,
    "learntime": 0.12615516502410173,
    "sampletime": 8.391289870953187,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 864,
    "reward_mean": 1.2350794120187567,
    "reward_max": 2.4874469240121844,
    "reward_min": -7.109258984376072,
    "reward_std": 2.628222469548667,
    "timesteps": 303682272,
    "learntime": 0.1300813271664083,
    "sampletime": 8.456714380998164,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 865,
    "reward_mean": 1.6026022296112474,
    "reward_max": 2.3109644573894235,
    "reward_min": -6.816320686757648,
    "reward_std": 1.7870009161014953,
    "timesteps": 304041846,
    "learntime": 0.12285377201624215,
    "sampletime": 8.457930772798136,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 866,
    "reward_mean": 0.8326013861322914,
    "reward_max": 2.416496360154818,
    "reward_min": -7.257145586514418,
    "reward_std": 3.020678468649745,
    "timesteps": 304399008,
    "learntime": 0.1405008127912879,
    "sampletime": 8.545068088918924,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 867,
    "reward_mean": -0.14645771932697477,
    "reward_max": 2.297914377813205,
    "reward_min": -15.669267444509778,
    "reward_std": 4.515098883966518,
    "timesteps": 304754127,
    "learntime": 0.12907566595822573,
    "sampletime": 8.411914934869856,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 868,
    "reward_mean": 0.37974206505785835,
    "reward_max": 2.276291086543066,
    "reward_min": -6.806539848229897,
    "reward_std": 3.2982106797251847,
    "timesteps": 305110401,
    "learntime": 0.1306552740279585,
    "sampletime": 8.484036691952497,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 869,
    "reward_mean": 1.8910009280270712,
    "reward_max": 2.27711319873823,
    "reward_min": 1.490245589977622,
    "reward_std": 0.1755790050177676,
    "timesteps": 305471121,
    "learntime": 0.1389623018912971,
    "sampletime": 8.53532840590924,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 870,
    "reward_mean": 1.11146437048995,
    "reward_max": 2.4293414529899784,
    "reward_min": -6.9175709397779,
    "reward_std": 2.4983818636505193,
    "timesteps": 305829579,
    "learntime": 0.14627687982283533,
    "sampletime": 8.530603480059654,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 871,
    "reward_mean": 1.810661224035487,
    "reward_max": 2.1509326319774638,
    "reward_min": 1.2523892453084964,
    "reward_std": 0.18885048035008492,
    "timesteps": 306190299,
    "learntime": 0.1297403951175511,
    "sampletime": 8.544341661036015,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 872,
    "reward_mean": 1.0546806374589748,
    "reward_max": 2.212530157292458,
    "reward_min": -7.180692963767796,
    "reward_std": 2.5299104808416306,
    "timesteps": 306548889,
    "learntime": 0.1401801290921867,
    "sampletime": 8.601852163905278,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 873,
    "reward_mean": 1.5471024640876134,
    "reward_max": 2.382624694620695,
    "reward_min": -7.062398154393042,
    "reward_std": 1.8495877505417784,
    "timesteps": 306908475,
    "learntime": 0.13278989703394473,
    "sampletime": 8.678455577930436,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 874,
    "reward_mean": 1.5078702261743906,
    "reward_max": 2.3924398595448677,
    "reward_min": -7.260111661798985,
    "reward_std": 1.8078844855938738,
    "timesteps": 307267932,
    "learntime": 0.13910049898549914,
    "sampletime": 8.47479254892096,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 875,
    "reward_mean": 1.4568523845799524,
    "reward_max": 2.227306436473911,
    "reward_min": -7.297702891286465,
    "reward_std": 1.887403073927811,
    "timesteps": 307627587,
    "learntime": 0.131520280148834,
    "sampletime": 8.566024363040924,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 876,
    "reward_mean": 1.4913787630760418,
    "reward_max": 2.319965445397729,
    "reward_min": -14.386652647370484,
    "reward_std": 2.3076362414571934,
    "timesteps": 307987059,
    "learntime": 0.1339443470351398,
    "sampletime": 8.517240724992007,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 877,
    "reward_mean": 1.460581928097632,
    "reward_max": 2.108391656843715,
    "reward_min": -6.308328171507232,
    "reward_std": 1.7068767880269506,
    "timesteps": 308346618,
    "learntime": 0.13189319986850023,
    "sampletime": 8.492271173978224,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 878,
    "reward_mean": 1.3957040602804565,
    "reward_max": 2.1357247686039145,
    "reward_min": -7.063218507167858,
    "reward_std": 1.828208948321239,
    "timesteps": 308706168,
    "learntime": 0.1238998759072274,
    "sampletime": 8.597128038061783,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 879,
    "reward_mean": 1.3858774869620605,
    "reward_max": 2.11645152223663,
    "reward_min": -7.141499293562173,
    "reward_std": 1.8614105381586556,
    "timesteps": 309065736,
    "learntime": 0.13231586595065892,
    "sampletime": 8.50955255003646,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 880,
    "reward_mean": 1.7217599207417216,
    "reward_max": 2.060117844549633,
    "reward_min": 1.3158254536789469,
    "reward_std": 0.16762584293405858,
    "timesteps": 309426456,
    "learntime": 0.13165120617486537,
    "sampletime": 8.61989460606128,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 881,
    "reward_mean": 1.8599037029978946,
    "reward_max": 2.127654957355733,
    "reward_min": 1.5992660960111964,
    "reward_std": 0.13546786992117846,
    "timesteps": 309787176,
    "learntime": 0.13348959293216467,
    "sampletime": 8.532475715037435,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 882,
    "reward_mean": 1.7727908635024436,
    "reward_max": 2.116386685132358,
    "reward_min": 1.5194960856734325,
    "reward_std": 0.1412236686599556,
    "timesteps": 310147896,
    "learntime": 0.13598806713707745,
    "sampletime": 8.67666688002646,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 883,
    "reward_mean": 1.7600646096906454,
    "reward_max": 2.1424999224096086,
    "reward_min": 1.380037654240201,
    "reward_std": 0.16344875834951592,
    "timesteps": 310508616,
    "learntime": 0.13025630288757384,
    "sampletime": 8.518026906996965,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 884,
    "reward_mean": 1.7954969357897363,
    "reward_max": 2.1670845189188213,
    "reward_min": 1.4021742535035353,
    "reward_std": 0.1518926475650741,
    "timesteps": 310869336,
    "learntime": 0.13077439600601792,
    "sampletime": 8.562045458005741,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 885,
    "reward_mean": 1.7751210565670807,
    "reward_max": 2.0552119750557742,
    "reward_min": 1.441251939040022,
    "reward_std": 0.11818278191568728,
    "timesteps": 311230056,
    "learntime": 0.13021669001318514,
    "sampletime": 8.680970628047362,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 886,
    "reward_mean": 1.494912201628548,
    "reward_max": 2.284627372948854,
    "reward_min": -7.065968682881887,
    "reward_std": 1.7738922287166563,
    "timesteps": 311589744,
    "learntime": 0.1328335888683796,
    "sampletime": 8.497812756104395,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 887,
    "reward_mean": 1.7707761897523944,
    "reward_max": 2.1003940026866696,
    "reward_min": 1.3347912791747734,
    "reward_std": 0.17890450812164618,
    "timesteps": 311950464,
    "learntime": 0.13706835894845426,
    "sampletime": 8.564727760152891,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 888,
    "reward_mean": 1.873245440594296,
    "reward_max": 2.2067037372180454,
    "reward_min": 1.6327084315214015,
    "reward_std": 0.13480469040154755,
    "timesteps": 312311184,
    "learntime": 0.13584152213297784,
    "sampletime": 8.519942712038755,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 889,
    "reward_mean": 1.8541960657899887,
    "reward_max": 2.097647182194507,
    "reward_min": 1.4884096005636898,
    "reward_std": 0.14017539099888285,
    "timesteps": 312671904,
    "learntime": 0.13368310406804085,
    "sampletime": 8.740320438984782,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 890,
    "reward_mean": 1.9028478207859558,
    "reward_max": 2.177001765296557,
    "reward_min": 1.5402455048760815,
    "reward_std": 0.13448820006077145,
    "timesteps": 313032624,
    "learntime": 0.1408823688980192,
    "sampletime": 8.605341293849051,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 891,
    "reward_mean": 1.8129558020972723,
    "reward_max": 2.247142902353184,
    "reward_min": 1.4068863724612353,
    "reward_std": 0.16012780806103105,
    "timesteps": 313393344,
    "learntime": 0.13568669091910124,
    "sampletime": 8.563864754047245,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 892,
    "reward_mean": 1.8878439111179042,
    "reward_max": 2.2064739368577233,
    "reward_min": 1.6202417536564573,
    "reward_std": 0.12821951270170007,
    "timesteps": 313754064,
    "learntime": 0.13203892321325839,
    "sampletime": 8.573363346979022,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 893,
    "reward_mean": -0.9253925301115015,
    "reward_max": 2.280452378362743,
    "reward_min": -56.831721688177716,
    "reward_std": 7.957965060816822,
    "timesteps": 314105685,
    "learntime": 0.13031102484092116,
    "sampletime": 8.645100333029404,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 894,
    "reward_mean": 1.4658563007351297,
    "reward_max": 2.2435508981227117,
    "reward_min": -7.655066891044213,
    "reward_std": 1.9786693603663843,
    "timesteps": 314465121,
    "learntime": 0.13356561306864023,
    "sampletime": 8.534327170113102,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 895,
    "reward_mean": 1.863021928678645,
    "reward_max": 2.318888994806911,
    "reward_min": 1.4215979442550697,
    "reward_std": 0.1730901324708495,
    "timesteps": 314825841,
    "learntime": 0.13615146419033408,
    "sampletime": 8.629577166866511,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 896,
    "reward_mean": 1.5639937289532808,
    "reward_max": 2.285754692077522,
    "reward_min": -6.525448764983595,
    "reward_std": 1.776766728252857,
    "timesteps": 315185226,
    "learntime": 0.13155564502812922,
    "sampletime": 8.527494260808453,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 897,
    "reward_mean": 1.1692865257500111,
    "reward_max": 2.27332290523389,
    "reward_min": -16.320014915806524,
    "reward_std": 3.070871620147353,
    "timesteps": 315543450,
    "learntime": 0.13279504398815334,
    "sampletime": 8.497494635172188,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 898,
    "reward_mean": 1.5430962975945826,
    "reward_max": 2.3161090923716623,
    "reward_min": -7.562922085748252,
    "reward_std": 1.9941556440393573,
    "timesteps": 315902865,
    "learntime": 0.1344286659732461,
    "sampletime": 8.536575766047463,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 899,
    "reward_mean": 1.8823631835892942,
    "reward_max": 2.2284670597556127,
    "reward_min": 1.1157955496896472,
    "reward_std": 0.20923515140251997,
    "timesteps": 316263585,
    "learntime": 0.13181226793676615,
    "sampletime": 8.568591444985941,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 900,
    "reward_mean": -0.5191038597549401,
    "reward_max": 2.2116967868668387,
    "reward_min": -44.07778995823306,
    "reward_std": 6.496385161662748,
    "timesteps": 316616733,
    "learntime": 0.14114777790382504,
    "sampletime": 8.43970697792247,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 901,
    "reward_mean": -0.2580671872856282,
    "reward_max": 2.2078615737356633,
    "reward_min": -43.75972524387092,
    "reward_std": 6.555402102867387,
    "timesteps": 316970952,
    "learntime": 0.13070087786763906,
    "sampletime": 8.393810681067407,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 902,
    "reward_mean": 1.5047976691206648,
    "reward_max": 2.1742600308657094,
    "reward_min": -7.296025348516005,
    "reward_std": 1.915349246746754,
    "timesteps": 317330349,
    "learntime": 0.13158463081344962,
    "sampletime": 8.559256627922878,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 903,
    "reward_mean": -1.5031934997543783,
    "reward_max": 2.318348745737844,
    "reward_min": -25.683617643933484,
    "reward_std": 6.353584687242934,
    "timesteps": 317680812,
    "learntime": 0.13989772787317634,
    "sampletime": 8.424356044037268,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 904,
    "reward_mean": -4.015042976851546,
    "reward_max": 2.2623273185560118,
    "reward_min": -44.372904056946886,
    "reward_std": 9.39742511094861,
    "timesteps": 318023415,
    "learntime": 0.12975455890409648,
    "sampletime": 8.215916082030162,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 905,
    "reward_mean": -1.4929028276860767,
    "reward_max": 2.1564008814307387,
    "reward_min": -72.46407372292103,
    "reward_std": 9.87810406792208,
    "timesteps": 318373584,
    "learntime": 0.13933178293518722,
    "sampletime": 8.320363306906074,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 906,
    "reward_mean": -1.9063962475030407,
    "reward_max": 2.2443087559870682,
    "reward_min": -44.216999720366665,
    "reward_std": 7.719156407285215,
    "timesteps": 318722589,
    "learntime": 0.1309317520353943,
    "sampletime": 8.264119869098067,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 907,
    "reward_mean": 1.8994953739708127,
    "reward_max": 2.1995664872358427,
    "reward_min": 1.4740510514218625,
    "reward_std": 0.14361598094222383,
    "timesteps": 319083309,
    "learntime": 0.1465233308263123,
    "sampletime": 8.638954580994323,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 908,
    "reward_mean": 0.1175346512578049,
    "reward_max": 2.1577123437274373,
    "reward_min": -16.82008701049243,
    "reward_std": 3.934855737513783,
    "timesteps": 319438995,
    "learntime": 0.1312500408384949,
    "sampletime": 8.505379348993301,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 909,
    "reward_mean": 1.1310858596988496,
    "reward_max": 2.422293585773633,
    "reward_min": -7.42556560804334,
    "reward_std": 2.7151277567553262,
    "timesteps": 319797054,
    "learntime": 0.1409864730667323,
    "sampletime": 8.467417093925178,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 910,
    "reward_mean": 0.64459238177705,
    "reward_max": 2.2243873908753584,
    "reward_min": -25.362886816065647,
    "reward_std": 4.159351274903119,
    "timesteps": 320154123,
    "learntime": 0.13748248596675694,
    "sampletime": 8.472974899923429,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 911,
    "reward_mean": 1.9505512289057891,
    "reward_max": 2.351912458546307,
    "reward_min": 1.6997304065940104,
    "reward_std": 0.141019842736662,
    "timesteps": 320514843,
    "learntime": 0.13813728699460626,
    "sampletime": 8.549063267186284,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 912,
    "reward_mean": 1.5772551426019876,
    "reward_max": 2.282010170348886,
    "reward_min": -6.947116827682214,
    "reward_std": 1.838333778969378,
    "timesteps": 320874501,
    "learntime": 0.13555816910229623,
    "sampletime": 8.603426335845143,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 913,
    "reward_mean": 2.024884952341532,
    "reward_max": 2.4394030203552415,
    "reward_min": 1.7932516424281666,
    "reward_std": 0.12662549103732287,
    "timesteps": 321235221,
    "learntime": 0.14417169988155365,
    "sampletime": 8.582381795160472,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 914,
    "reward_mean": 1.6008470518326288,
    "reward_max": 2.4776597512871796,
    "reward_min": -7.312587509563226,
    "reward_std": 1.9536801579381264,
    "timesteps": 321594615,
    "learntime": 0.1348712278995663,
    "sampletime": 8.56668334105052,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 915,
    "reward_mean": 1.5782389965570978,
    "reward_max": 2.3375191012235117,
    "reward_min": -6.967821647383091,
    "reward_std": 1.8602618089372929,
    "timesteps": 321954165,
    "learntime": 0.13595148804597557,
    "sampletime": 8.467545042047277,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 916,
    "reward_mean": 1.986790209769965,
    "reward_max": 2.248539067820685,
    "reward_min": 1.754539182490781,
    "reward_std": 0.10407720846158905,
    "timesteps": 322314885,
    "learntime": 0.1353953129146248,
    "sampletime": 8.629309793002903,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 917,
    "reward_mean": 2.018658341234973,
    "reward_max": 2.515531743475353,
    "reward_min": 1.6775388396309774,
    "reward_std": 0.17843611564718811,
    "timesteps": 322675605,
    "learntime": 0.13826323207467794,
    "sampletime": 8.549538047984242,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 918,
    "reward_mean": 1.9628089949694678,
    "reward_max": 2.3438891331527625,
    "reward_min": 1.5779768539424452,
    "reward_std": 0.15679342947549435,
    "timesteps": 323036325,
    "learntime": 0.12681613396853209,
    "sampletime": 8.659439423820004,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 919,
    "reward_mean": 1.5910505524237848,
    "reward_max": 2.3798585048465997,
    "reward_min": -6.9285637952826535,
    "reward_std": 1.771792877415144,
    "timesteps": 323395863,
    "learntime": 0.13179606688208878,
    "sampletime": 8.509238809114322,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 920,
    "reward_mean": 1.9894247923112132,
    "reward_max": 2.296210965804425,
    "reward_min": 1.6553994025796912,
    "reward_std": 0.13075013104720853,
    "timesteps": 323756583,
    "learntime": 0.13431249698624015,
    "sampletime": 8.601045081857592,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 921,
    "reward_mean": 1.9790452246230033,
    "reward_max": 2.2944813096740564,
    "reward_min": 1.7190764889934185,
    "reward_std": 0.11163915164623055,
    "timesteps": 324117303,
    "learntime": 0.13507293607108295,
    "sampletime": 8.60119773610495,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 922,
    "reward_mean": 2.037909726754277,
    "reward_max": 2.3387314781747643,
    "reward_min": 1.6213703611154184,
    "reward_std": 0.13322580950416812,
    "timesteps": 324478023,
    "learntime": 0.1381100460421294,
    "sampletime": 8.52853710995987,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 923,
    "reward_mean": 2.0079925738373525,
    "reward_max": 2.3305904760455785,
    "reward_min": 1.5897392531844516,
    "reward_std": 0.14605612797077538,
    "timesteps": 324838743,
    "learntime": 0.13172512291930616,
    "sampletime": 8.618275105953217,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 924,
    "reward_mean": 1.988470646265514,
    "reward_max": 2.277919569621159,
    "reward_min": 1.641324087253855,
    "reward_std": 0.1428959972658094,
    "timesteps": 325199463,
    "learntime": 0.13097626389935613,
    "sampletime": 8.574169856030494,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 925,
    "reward_mean": 1.9461328579292738,
    "reward_max": 2.181039463954439,
    "reward_min": 1.7219470524781173,
    "reward_std": 0.12314249424996096,
    "timesteps": 325560183,
    "learntime": 0.13237397302873433,
    "sampletime": 8.5472410840448,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 926,
    "reward_mean": 1.5685182496988936,
    "reward_max": 2.212847539755534,
    "reward_min": -6.687215867521997,
    "reward_std": 1.7747033776011711,
    "timesteps": 325919730,
    "learntime": 0.13335848413407803,
    "sampletime": 8.649767386028543,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 927,
    "reward_mean": 1.9901606215691863,
    "reward_max": 2.222145019581973,
    "reward_min": 1.662865197711099,
    "reward_std": 0.13538457154527184,
    "timesteps": 326280450,
    "learntime": 0.13722518202848732,
    "sampletime": 8.529286639997736,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 928,
    "reward_mean": 2.0036273539674743,
    "reward_max": 2.2890087677609907,
    "reward_min": 1.6339615462334613,
    "reward_std": 0.15332101566591352,
    "timesteps": 326641170,
    "learntime": 0.13657840597443283,
    "sampletime": 8.594186183996499,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 929,
    "reward_mean": 1.9847013593762015,
    "reward_max": 2.2211340597455567,
    "reward_min": 1.7147502720595844,
    "reward_std": 0.11312628499417207,
    "timesteps": 327001890,
    "learntime": 0.12955220718868077,
    "sampletime": 8.557601912179962,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 930,
    "reward_mean": 1.9913568717313692,
    "reward_max": 2.333845837006162,
    "reward_min": 1.6394861769028148,
    "reward_std": 0.13154387372404885,
    "timesteps": 327362610,
    "learntime": 0.14433645992539823,
    "sampletime": 8.54457170702517,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 931,
    "reward_mean": 1.8892412635377405,
    "reward_max": 2.1715567920896706,
    "reward_min": 1.5633839559902993,
    "reward_std": 0.134003678341809,
    "timesteps": 327723330,
    "learntime": 0.13855481194332242,
    "sampletime": 8.604503042064607,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 932,
    "reward_mean": 1.9715837546563217,
    "reward_max": 2.3835490131662485,
    "reward_min": 1.5802867794920894,
    "reward_std": 0.1670336476234922,
    "timesteps": 328084050,
    "learntime": 0.13422062410973012,
    "sampletime": 8.55365584907122,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 933,
    "reward_mean": 1.9196771591264765,
    "reward_max": 2.2794922597980363,
    "reward_min": 1.643819470748754,
    "reward_std": 0.12484688335177059,
    "timesteps": 328444770,
    "learntime": 0.1320181949995458,
    "sampletime": 8.552754114149138,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 934,
    "reward_mean": 1.9828537070078012,
    "reward_max": 2.4941554930725633,
    "reward_min": 1.5327499322152205,
    "reward_std": 0.172873716412773,
    "timesteps": 328805490,
    "learntime": 0.13753990200348198,
    "sampletime": 8.513155224965885,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 935,
    "reward_mean": 1.5465501656633598,
    "reward_max": 2.2908226255517383,
    "reward_min": -8.041191771686446,
    "reward_std": 1.9927559117930034,
    "timesteps": 329164851,
    "learntime": 0.14544854988344014,
    "sampletime": 8.679861592128873,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 936,
    "reward_mean": 1.9923708280431978,
    "reward_max": 2.376214143308582,
    "reward_min": 1.6416084975794407,
    "reward_std": 0.1387512041067656,
    "timesteps": 329525571,
    "learntime": 0.12882661493495107,
    "sampletime": 8.564455865882337,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 937,
    "reward_mean": 1.9620739046658342,
    "reward_max": 2.231287519052985,
    "reward_min": 1.6200943371725496,
    "reward_std": 0.13401354998709064,
    "timesteps": 329886291,
    "learntime": 0.13933068979531527,
    "sampletime": 8.53381032589823,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 938,
    "reward_mean": 1.9779234690031504,
    "reward_max": 2.3240484799612022,
    "reward_min": 1.5957576725279161,
    "reward_std": 0.13522035693124368,
    "timesteps": 330247011,
    "learntime": 0.13689223607070744,
    "sampletime": 8.684630362084135,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 939,
    "reward_mean": 2.0188424576488697,
    "reward_max": 2.3652269430211557,
    "reward_min": 1.6222657577653221,
    "reward_std": 0.12892341482743105,
    "timesteps": 330607731,
    "learntime": 0.13260448700748384,
    "sampletime": 8.491430790163577,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 940,
    "reward_mean": 1.995154664904311,
    "reward_max": 2.2174293193278958,
    "reward_min": 1.6528303432243048,
    "reward_std": 0.13632525119838276,
    "timesteps": 330968451,
    "learntime": 0.13738745590671897,
    "sampletime": 8.490829499904066,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 941,
    "reward_mean": 1.9896082243383533,
    "reward_max": 2.228838109488907,
    "reward_min": 1.6616489591791472,
    "reward_std": 0.12346900762349271,
    "timesteps": 331329171,
    "learntime": 0.13703901111148298,
    "sampletime": 8.539611635962501,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 942,
    "reward_mean": 2.0084857138792658,
    "reward_max": 2.3792790775187287,
    "reward_min": 1.7133832229301305,
    "reward_std": 0.1357014472226384,
    "timesteps": 331689891,
    "learntime": 0.13230679696425796,
    "sampletime": 8.692971657030284,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 943,
    "reward_mean": 1.9950088059332596,
    "reward_max": 2.3619794975736896,
    "reward_min": 1.6763961349409326,
    "reward_std": 0.15226905934413668,
    "timesteps": 332050611,
    "learntime": 0.1287192429881543,
    "sampletime": 8.651632135966793,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 944,
    "reward_mean": 2.0626108539604138,
    "reward_max": 2.374027192571452,
    "reward_min": 1.5963723210496163,
    "reward_std": 0.12960981907290997,
    "timesteps": 332411331,
    "learntime": 0.13432746496982872,
    "sampletime": 8.59633665299043,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 945,
    "reward_mean": 2.0165286646936043,
    "reward_max": 2.4123871627433027,
    "reward_min": 1.7012952144017819,
    "reward_std": 0.13890309633277861,
    "timesteps": 332772051,
    "learntime": 0.1420553510542959,
    "sampletime": 8.572500946931541,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 946,
    "reward_mean": 2.038630036528767,
    "reward_max": 2.3236621988824364,
    "reward_min": 1.5709779976565494,
    "reward_std": 0.12563676179900704,
    "timesteps": 333132771,
    "learntime": 0.1433181739412248,
    "sampletime": 8.647027658997104,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 947,
    "reward_mean": 1.9971177228574823,
    "reward_max": 2.2937944963059347,
    "reward_min": 1.5621371760216471,
    "reward_std": 0.1460052448869989,
    "timesteps": 333493491,
    "learntime": 0.1384372499305755,
    "sampletime": 8.6735394441057,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 948,
    "reward_mean": 2.0333405218810596,
    "reward_max": 2.440215555030257,
    "reward_min": 1.7838726877411248,
    "reward_std": 0.13851125494427652,
    "timesteps": 333854211,
    "learntime": 0.1299785589799285,
    "sampletime": 8.618668937124312,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 949,
    "reward_mean": 2.1067309288949843,
    "reward_max": 2.3901355440065126,
    "reward_min": 1.6215671880856823,
    "reward_std": 0.14558196820037053,
    "timesteps": 334214931,
    "learntime": 0.13566864700987935,
    "sampletime": 8.576928271912038,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 950,
    "reward_mean": 1.9957705745704333,
    "reward_max": 2.3953897324108473,
    "reward_min": 1.778172024116483,
    "reward_std": 0.11905145545863127,
    "timesteps": 334575651,
    "learntime": 0.14596823789179325,
    "sampletime": 8.679986758856103,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 951,
    "reward_mean": 2.0448437996133926,
    "reward_max": 2.2822330567851723,
    "reward_min": 1.813269284262785,
    "reward_std": 0.12595045182927822,
    "timesteps": 334936371,
    "learntime": 0.13857959699817002,
    "sampletime": 8.65784468385391,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 952,
    "reward_mean": 2.0668231992114574,
    "reward_max": 2.4950151755968384,
    "reward_min": 1.7871402792754267,
    "reward_std": 0.13419370973009645,
    "timesteps": 335297091,
    "learntime": 0.12753304187208414,
    "sampletime": 8.528238686034456,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 953,
    "reward_mean": 2.067277340961052,
    "reward_max": 2.415330833684876,
    "reward_min": 1.8500947224877577,
    "reward_std": 0.1146186219334248,
    "timesteps": 335657811,
    "learntime": 0.13307616184465587,
    "sampletime": 8.532335914904252,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 954,
    "reward_mean": 2.043061486483447,
    "reward_max": 2.371373719444044,
    "reward_min": 1.7775155035196795,
    "reward_std": 0.134130242662189,
    "timesteps": 336018531,
    "learntime": 0.13764713611453772,
    "sampletime": 8.590246772859246,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 955,
    "reward_mean": 2.050363006207376,
    "reward_max": 2.37344357548246,
    "reward_min": 1.8124697844914095,
    "reward_std": 0.10282945779840127,
    "timesteps": 336379251,
    "learntime": 0.13000672403723001,
    "sampletime": 8.55959857115522,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 956,
    "reward_mean": 2.036481311544003,
    "reward_max": 2.269638788004431,
    "reward_min": 1.7278140992099027,
    "reward_std": 0.10998657450593648,
    "timesteps": 336739971,
    "learntime": 0.13814708404242992,
    "sampletime": 8.572057609912008,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 957,
    "reward_mean": 2.0402857571172075,
    "reward_max": 2.428110061915393,
    "reward_min": 1.623674421313667,
    "reward_std": 0.17148520247734228,
    "timesteps": 337100691,
    "learntime": 0.12849628180265427,
    "sampletime": 8.6645183339715,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 958,
    "reward_mean": 2.0121331243252993,
    "reward_max": 2.2265782781482395,
    "reward_min": 1.7147443634158746,
    "reward_std": 0.10569031607170803,
    "timesteps": 337461411,
    "learntime": 0.1421641749329865,
    "sampletime": 8.597589421086013,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 959,
    "reward_mean": 2.0018098679187695,
    "reward_max": 2.3258247434083956,
    "reward_min": 1.7741231458472357,
    "reward_std": 0.11509055857083243,
    "timesteps": 337822131,
    "learntime": 0.12740078498609364,
    "sampletime": 8.512320574140176,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 960,
    "reward_mean": 2.0183192802002026,
    "reward_max": 2.56124448671471,
    "reward_min": 1.6841434337547965,
    "reward_std": 0.1570147541150763,
    "timesteps": 338182851,
    "learntime": 0.12361057917587459,
    "sampletime": 8.463249843101948,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 961,
    "reward_mean": 2.070941188531805,
    "reward_max": 2.4451134699063677,
    "reward_min": 1.8035720478117978,
    "reward_std": 0.1369739753987854,
    "timesteps": 338543571,
    "learntime": 0.14546719403006136,
    "sampletime": 8.579075217014179,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 962,
    "reward_mean": 0.7756082895352225,
    "reward_max": 2.3531764836868985,
    "reward_min": -14.921064866310594,
    "reward_std": 3.404060001330503,
    "timesteps": 338900286,
    "learntime": 0.13991995807737112,
    "sampletime": 8.623815187020227,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 963,
    "reward_mean": 1.967920462843845,
    "reward_max": 2.307458258880421,
    "reward_min": 1.593531846033519,
    "reward_std": 0.1389454113463928,
    "timesteps": 339261006,
    "learntime": 0.1368470098823309,
    "sampletime": 8.477878276957199,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 964,
    "reward_mean": 2.0383743033126365,
    "reward_max": 2.3107506407311886,
    "reward_min": 1.7756798632670474,
    "reward_std": 0.11377524910974551,
    "timesteps": 339621726,
    "learntime": 0.12907293601892889,
    "sampletime": 8.600962659111246,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 965,
    "reward_mean": 2.008230099689332,
    "reward_max": 2.482559964422963,
    "reward_min": 1.7756785894546019,
    "reward_std": 0.13453549074421148,
    "timesteps": 339982446,
    "learntime": 0.13322437112219632,
    "sampletime": 8.536198384128511,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 966,
    "reward_mean": 0.7755027494900333,
    "reward_max": 2.45222417514235,
    "reward_min": -23.394125924704394,
    "reward_std": 3.9809449622718254,
    "timesteps": 340339149,
    "learntime": 0.13959550601430237,
    "sampletime": 8.450417225016281,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 967,
    "reward_mean": 2.0091464197966733,
    "reward_max": 2.280471598121835,
    "reward_min": 1.7370233467822371,
    "reward_std": 0.11097077265913274,
    "timesteps": 340699869,
    "learntime": 0.12995545496232808,
    "sampletime": 8.670263986103237,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 968,
    "reward_mean": 0.025532419974485743,
    "reward_max": 2.4749054441993135,
    "reward_min": -48.56665675437156,
    "reward_std": 7.059927386206668,
    "timesteps": 341053947,
    "learntime": 0.13145123701542616,
    "sampletime": 8.444936570944265,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 969,
    "reward_mean": -0.06474283916289925,
    "reward_max": 2.407849629037727,
    "reward_min": -25.70871177985629,
    "reward_std": 5.086232614007527,
    "timesteps": 341408025,
    "learntime": 0.12834271392785013,
    "sampletime": 8.495871757157147,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 970,
    "reward_mean": 2.037130350335959,
    "reward_max": 2.298530539556142,
    "reward_min": 1.6187261039297212,
    "reward_std": 0.1321286332306511,
    "timesteps": 341768745,
    "learntime": 0.13456554082222283,
    "sampletime": 8.52045983611606,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 971,
    "reward_mean": -0.4869551933900923,
    "reward_max": 2.2948474192385064,
    "reward_min": -34.653691877689475,
    "reward_std": 6.093628807006116,
    "timesteps": 342121758,
    "learntime": 0.12864949088543653,
    "sampletime": 8.52975358394906,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 972,
    "reward_mean": 1.9891446913980573,
    "reward_max": 2.4370883073782093,
    "reward_min": 1.6483893601795274,
    "reward_std": 0.15418712721858355,
    "timesteps": 342482478,
    "learntime": 0.12865285598672926,
    "sampletime": 8.48780611390248,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 973,
    "reward_mean": 1.515174220319939,
    "reward_max": 2.2043726150736647,
    "reward_min": -7.544031322686794,
    "reward_std": 1.9706988923701019,
    "timesteps": 342841866,
    "learntime": 0.13875584793277085,
    "sampletime": 8.45995900593698,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 974,
    "reward_mean": 2.018874720752273,
    "reward_max": 2.3745882854528797,
    "reward_min": 1.5371209103984484,
    "reward_std": 0.1847771354413393,
    "timesteps": 343202586,
    "learntime": 0.13289428898133337,
    "sampletime": 8.619486167095602,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 975,
    "reward_mean": 2.050478381576055,
    "reward_max": 2.37728013267747,
    "reward_min": 1.8163877623508453,
    "reward_std": 0.1273262698586842,
    "timesteps": 343563306,
    "learntime": 0.1407002629712224,
    "sampletime": 8.618249675026163,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 976,
    "reward_mean": 1.6493230194638153,
    "reward_max": 2.5705060435910547,
    "reward_min": -7.335942272280318,
    "reward_std": 1.9405712802754498,
    "timesteps": 343922697,
    "learntime": 0.13346105488017201,
    "sampletime": 8.787483491003513,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 977,
    "reward_mean": 2.0401918993125916,
    "reward_max": 2.3543599326812608,
    "reward_min": 1.7500549141194706,
    "reward_std": 0.12048883717712092,
    "timesteps": 344283417,
    "learntime": 0.133895724080503,
    "sampletime": 8.550650449935347,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 978,
    "reward_mean": 0.355239651138657,
    "reward_max": 2.6956026499498273,
    "reward_min": -31.930194234422142,
    "reward_std": 5.054353878413024,
    "timesteps": 344638818,
    "learntime": 0.12831053300760686,
    "sampletime": 8.340385823044926,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 979,
    "reward_mean": 1.6315889245963813,
    "reward_max": 2.4899843045030545,
    "reward_min": -6.796942216083125,
    "reward_std": 1.8223879641358165,
    "timesteps": 344998350,
    "learntime": 0.13159219198860228,
    "sampletime": 8.463311803992838,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 980,
    "reward_mean": 2.0731866687982574,
    "reward_max": 2.5546710248325097,
    "reward_min": 1.6219151247102557,
    "reward_std": 0.1764038768921995,
    "timesteps": 345359070,
    "learntime": 0.14087239699438214,
    "sampletime": 8.643461772007868,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 981,
    "reward_mean": 2.1000777883152795,
    "reward_max": 2.6728436180415085,
    "reward_min": 1.5810760000269044,
    "reward_std": 0.19319982589449997,
    "timesteps": 345719790,
    "learntime": 0.12733025010675192,
    "sampletime": 8.53956155385822,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 982,
    "reward_mean": 1.9827050224086862,
    "reward_max": 2.3730910752377805,
    "reward_min": 1.6081922223339908,
    "reward_std": 0.1537302335755485,
    "timesteps": 346080510,
    "learntime": 0.13604773697443306,
    "sampletime": 8.557540348963812,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 983,
    "reward_mean": 2.073521373468882,
    "reward_max": 2.3789202620550456,
    "reward_min": 1.7333608702421308,
    "reward_std": 0.16365854139568947,
    "timesteps": 346441230,
    "learntime": 0.12749885697849095,
    "sampletime": 8.580142353894189,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 984,
    "reward_mean": 1.370767082182955,
    "reward_max": 2.6974022518123864,
    "reward_min": -6.765358581961749,
    "reward_std": 2.5613363016606026,
    "timesteps": 346799703,
    "learntime": 0.13169811107218266,
    "sampletime": 8.507478354033083,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 985,
    "reward_mean": 1.7010666763350468,
    "reward_max": 2.6968377327106645,
    "reward_min": -6.972954729757148,
    "reward_std": 1.8223892823399208,
    "timesteps": 347159649,
    "learntime": 0.13905229489319026,
    "sampletime": 8.526216997066513,
    "best_max_mean": 0.609930362310963,
    "best_max": 2.8464966895399155
  },
  {
    "gen": 986,
    "reward_mean": 0.21908888634454277,
    "reward_max": 3.0247728231382394,
    "reward_min": -43.293180519441556,
    "reward_std": 6.503788240962341,
    "timesteps": 347513823,
    "learntime": 0.13928057393059134,
    "sampletime": 8.438598353182897,
    "best_max_mean": 0.21908888634454277,
    "best_max": 3.0247728231382394
  },
  {
    "gen": 987,
    "reward_mean": 2.221008461714275,
    "reward_max": 2.7665517764875047,
    "reward_min": 1.8077450058542888,
    "reward_std": 0.23423394069410705,
    "timesteps": 347874543,
    "learntime": 0.13627752987667918,
    "sampletime": 8.61885311990045,
    "best_max_mean": 0.21908888634454277,
    "best_max": 3.0247728231382394
  },
  {
    "gen": 988,
    "reward_mean": 1.761744857456289,
    "reward_max": 3.0462437489662637,
    "reward_min": -7.519939049644041,
    "reward_std": 1.9330622220985694,
    "timesteps": 348234621,
    "learntime": 0.13185284193605185,
    "sampletime": 8.513400563038886,
    "best_max_mean": 1.761744857456289,
    "best_max": 3.0462437489662637
  },
  {
    "gen": 989,
    "reward_mean": 2.2967302355793926,
    "reward_max": 2.779941788878093,
    "reward_min": 1.7830589912999912,
    "reward_std": 0.22832840648933783,
    "timesteps": 348595341,
    "learntime": 0.17910937080159783,
    "sampletime": 8.529871864942834,
    "best_max_mean": 1.761744857456289,
    "best_max": 3.0462437489662637
  },
  {
    "gen": 990,
    "reward_mean": 2.2407494287564713,
    "reward_max": 2.8782800980972927,
    "reward_min": 1.8528144366173345,
    "reward_std": 0.23630007699592487,
    "timesteps": 348956061,
    "learntime": 0.13617038703523576,
    "sampletime": 8.63866091100499,
    "best_max_mean": 1.761744857456289,
    "best_max": 3.0462437489662637
  },
  {
    "gen": 991,
    "reward_mean": 2.3979669700965105,
    "reward_max": 3.354699164844172,
    "reward_min": 1.8048902262946458,
    "reward_std": 0.3527277997379734,
    "timesteps": 349316781,
    "learntime": 0.19857020396739244,
    "sampletime": 8.5791264208965,
    "best_max_mean": 2.3979669700965105,
    "best_max": 3.354699164844172
  },
  {
    "gen": 992,
    "reward_mean": 2.5810795025413036,
    "reward_max": 3.6058097556762516,
    "reward_min": 1.8261816850157815,
    "reward_std": 0.40038551050427723,
    "timesteps": 349677501,
    "learntime": 0.14180656289681792,
    "sampletime": 8.694782214006409,
    "best_max_mean": 2.5810795025413036,
    "best_max": 3.6058097556762516
  },
  {
    "gen": 993,
    "reward_mean": 2.029353227860674,
    "reward_max": 3.338584580613919,
    "reward_min": -6.755547066049821,
    "reward_std": 1.9357577390798926,
    "timesteps": 350036880,
    "learntime": 0.19803150300867856,
    "sampletime": 8.654404973844066,
    "best_max_mean": 2.5810795025413036,
    "best_max": 3.6058097556762516
  },
  {
    "gen": 994,
    "reward_mean": 2.704639808718173,
    "reward_max": 3.3669189532449693,
    "reward_min": 2.0407560579231774,
    "reward_std": 0.33436780894939283,
    "timesteps": 350397600,
    "learntime": 0.17441125214099884,
    "sampletime": 8.575108977034688,
    "best_max_mean": 2.5810795025413036,
    "best_max": 3.6058097556762516
  },
  {
    "gen": 995,
    "reward_mean": 1.5895394345748506,
    "reward_max": 3.737301921773572,
    "reward_min": -6.831432988909499,
    "reward_std": 3.156505817096844,
    "timesteps": 350755389,
    "learntime": 0.13477310095913708,
    "sampletime": 8.553836167091504,
    "best_max_mean": 1.5895394345748506,
    "best_max": 3.737301921773572
  },
  {
    "gen": 996,
    "reward_mean": 2.431205130532,
    "reward_max": 4.297030082131666,
    "reward_min": -6.645982099247211,
    "reward_std": 2.0199415180927685,
    "timesteps": 351115464,
    "learntime": 0.1484560421667993,
    "sampletime": 8.591402634046972,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 997,
    "reward_mean": 2.30108739223557,
    "reward_max": 3.9422323696247354,
    "reward_min": -7.228842272652513,
    "reward_std": 2.6995081465438604,
    "timesteps": 351474636,
    "learntime": 0.1500527539756149,
    "sampletime": 8.550738845020533,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 998,
    "reward_mean": 3.138821190030484,
    "reward_max": 4.037876951349474,
    "reward_min": 2.5356073878620804,
    "reward_std": 0.34550179504695805,
    "timesteps": 351835356,
    "learntime": 0.12627008790150285,
    "sampletime": 8.573213102063164,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 999,
    "reward_mean": 2.019739532884566,
    "reward_max": 4.004165569397928,
    "reward_min": -15.560689621181654,
    "reward_std": 3.6415538205825357,
    "timesteps": 352193622,
    "learntime": 0.1336054860148579,
    "sampletime": 8.541589735075831,
    "best_max_mean": 2.431205130532,
    "best_max": 4.297030082131666
  },
  {
    "gen": 1000,
    "reward_mean": -0.38326145188591765,
    "reward_max": 4.942607709126383,
    "reward_min": -42.911911682239875,
    "reward_std": 7.432384335666449,
    "timesteps": 352545072,
    "learntime": 0.1342503889463842,
    "sampletime": 8.439194326056167,
    "best_max_mean": -0.38326145188591765,
    "best_max": 4.942607709126383
  }
]