# Name of the environment this configuration selects.
# NOTE(review): presumably looked up in the project's environment registry;
# confirm that "mpe_spread" is a registered key.
env: mpe_spread

# Environment-specific settings, grouped under one mapping.
# NOTE(review): presumably forwarded to the environment selected by `env`;
# confirm against the code that consumes this file.
env_args:
  # Agent count handed to the environment.
  n_agents: 3
  # presumably the side length of the grid world -- TODO confirm
  grid_size: 5
  # presumably the maximum number of steps per episode -- TODO confirm
  episode_limit: 50
  # NOTE(review): looks like a discount factor, but it sits under env_args
  # rather than with the training settings; verify which component reads it.
  gamma: 0.99
  # NOTE(review): meaning is not visible from this file (possibly an
  # observation or interaction radius); confirm with the environment code.
  neighborhood: 1

# Logging and evaluation schedule.
# The three *_log_interval keys and test_interval all use the same value
# (20000); units are presumably environment timesteps -- TODO confirm.
learner_log_interval: 20000
log_interval: 20000
runner_log_interval: 20000
# Overall run length (10,050,000); presumably in the same units as the
# intervals above -- TODO confirm.
t_max: 10050000
test_interval: 20000
# presumably the number of episodes run per evaluation round -- TODO confirm
test_nepisode: 24
# Boolean flag written in canonical lowercase form so every YAML loader
# (1.1 and 1.2, including strict schemas) reads it as a boolean.
# presumably selects greedy action choice during evaluation -- TODO confirm
test_greedy: true
