# Configuration named "antpush-test".
# NOTE(review): the code that consumes this file is not visible from here.
# Comments below either restate what the keys/values show or are explicitly
# marked as assumptions to confirm against the loader.
name: antpush-test
# Environment settings.
env:
  name: AntPush  # environment identifier
  steps: 500  # max steps for env
# Training settings.
training:
  episodes: 5  # episodes per policy
  policies: 256  # policies in one generation
  generations: 700  # presumably the number of generations to run -- confirm
# NOTE(review): "hrl" presumably stands for hierarchical RL; the meaning of
# the keys in this section is not documented in this file -- TODO confirm.
hrl:
  pretrained: ""  # empty string; presumably "no pretrained model" -- confirm
  interval: 50  # NOTE(review): units not shown here (env steps?) -- confirm
  cdist: 4  # NOTE(review): meaning not evident from this file -- confirm
  onehot: false  # boolean flag; what it toggles is not shown here -- confirm