# Settings stored under the `minatar` key.
# NOTE(review): unlike `cartpole`, no `env` key is set here -- presumably the
# environment is selected elsewhere; confirm against the code that loads this.
# Integers are written without `_` separators: that form is YAML 1.1 only and
# strict YAML 1.2 loaders would return strings instead of ints.
minatar:
  discount: 0.99
  duration: 5000000  # 5 million
  # A name rather than a number (`cartpole` uses 0.05) -- presumably resolved
  # by the consumer; confirm.
  epsilon: minatar
  extractor: minatarcnn
  prepop: 5000  # 5 thousand
  rmem_size: 100000  # 100 thousand
  target_period: 1000  # 1 thousand
  train_period: 4

# Settings stored under the `cartpole` key. The `&cartpole` anchor lets other
# mappings in this file reuse these values through an alias (`*cartpole`).
# Integers are written without `_` separators: that form is YAML 1.1 only and
# strict YAML 1.2 loaders would return strings instead of ints.
cartpole: &cartpole
  discount: 0.99
  duration: 500000  # 500 thousand
  env: CartPole-v1
  epsilon: 0.05
  extractor: mlpcontrol
  prepop: 5000  # 5 thousand
  rmem_size: 100000  # 100 thousand
  target_period: 500
  train_period: 4

# Settings stored under the `lunar` key: identical to `cartpole` except for
# `env`.
lunar:
  # Merge key: copies every key/value of the `cartpole` mapping into this one.
  # The merge is shallow, and keys written explicitly below take precedence.
  # `<<` is a YAML 1.1 extension, so the loader must support merge keys.
  <<: *cartpole
  # NOTE(review): recent Gymnasium releases appear to register LunarLander-v3
  # in place of v2 -- confirm this id exists in the installed version.
  env: LunarLander-v2
