[
  {
    "gen": 200,
    "reward_mean": 1.826038165786484,
    "reward_std": 6.969379981558661e-09,
    "timesteps": 64382958,
    "best_max_mean_sampling": 1.8438424855624782,
    "best_max_sampling": 2.4353959641779146,
    "episodes": 32
  },
  {
    "gen": 400,
    "reward_mean": 1.7662646793172194,
    "reward_std": 7.450580596923828e-09,
    "timesteps": 136474590,
    "best_max_mean_sampling": 1.845385926277884,
    "best_max_sampling": 2.503494267680003,
    "episodes": 32
  },
  {
    "gen": 600,
    "reward_mean": 1.7662646793172194,
    "reward_std": 7.450580596923828e-09,
    "timesteps": 208575396,
    "best_max_mean_sampling": 1.845385926277884,
    "best_max_sampling": 2.503494267680003,
    "episodes": 32
  },
  {
    "gen": 800,
    "reward_mean": 1.7662646793172194,
    "reward_std": 7.450580596923828e-09,
    "timesteps": 280673181,
    "best_max_mean_sampling": 1.845385926277884,
    "best_max_sampling": 2.503494267680003,
    "episodes": 32
  },
  {
    "gen": 1000,
    "reward_mean": 3.7087402383073487,
    "reward_std": 1.0536712127723509e-08,
    "timesteps": 352545072,
    "best_max_mean_sampling": -0.38326145188591765,
    "best_max_sampling": 4.942607709126383,
    "episodes": 32
  },
  {
    "gen": 1200,
    "reward_mean": 8.366702684444133,
    "reward_std": 1.148211584048155e-08,
    "timesteps": 424111227,
    "best_max_mean_sampling": 6.671526063676533,
    "best_max_sampling": 9.96469847913712,
    "episodes": 32
  },
  {
    "gen": 1400,
    "reward_mean": 19.975574504459775,
    "reward_std": 1.8250120749944284e-08,
    "timesteps": 495627879,
    "best_max_mean_sampling": 17.889918623988216,
    "best_max_sampling": 23.95931725036071,
    "episodes": 32
  },
  {
    "gen": 1600,
    "reward_mean": 22.1489091215047,
    "reward_std": 2.5809568279517847e-08,
    "timesteps": 566554188,
    "best_max_mean_sampling": 13.642681692213058,
    "best_max_sampling": 25.03806481092599,
    "episodes": 32
  },
  {
    "gen": 1800,
    "reward_mean": 22.1489091215047,
    "reward_std": 2.5809568279517847e-08,
    "timesteps": 636147039,
    "best_max_mean_sampling": 13.642681692213058,
    "best_max_sampling": 25.03806481092599,
    "episodes": 32
  },
  {
    "gen": 2000,
    "reward_mean": 22.1489091215047,
    "reward_std": 2.5809568279517847e-08,
    "timesteps": 706683864,
    "best_max_mean_sampling": 13.642681692213058,
    "best_max_sampling": 25.03806481092599,
    "episodes": 32
  }
]