# Environment selection and the arguments passed to it.
# NOTE(review): `tensorgame` is presumably a name looked up by the code that
# loads this file — confirm against the consumer.
env: tensorgame

env_args:
  # Alternative parameter set kept for reference: 5 agents, 5 actions,
  # target 4, six reward entries. To switch, uncomment these four lines and
  # comment out the active n_agents/n_actions/target/rewards lines below;
  # leaving both sets active would produce duplicate keys.
  #n_agents: 5
  #n_actions: 5
  #target: 4
  #rewards: [0.2, 0.1, 0.6, 0.4, 1.0, 0.7]
  # Active parameter set: 3 agents, 3 actions, target 2, four reward entries.
  n_agents: 3
  n_actions: 3
  target: 2
  # In both parameter sets `rewards` has target + 2 entries; presumably the
  # list length is coupled to `target` — verify against the environment code.
  # The bare `0` loads as an integer while the other entries load as floats.
  rewards: [0.6, 0, 1.0, 0.5]
  # NOTE(review): presumably the maximum number of steps per episode — confirm.
  episode_limit: 10

# Run, evaluation and logging schedule.
# The capitalised True/False values load as booleans under a YAML 1.1 loader
# such as PyYAML.
# NOTE(review): the meaning and units of the settings below are not visible
# in this file; the descriptions are assumptions to confirm with the consumer.

# presumably disables the recurrent variant of the agent network — confirm
use_rnn: False
# presumably evaluation episodes use greedy action selection — confirm
test_greedy: True
# presumably the number of episodes per evaluation round — confirm
test_nepisode: 10
# test_interval and log_interval share the same value (500); the
# runner/learner log intervals share a smaller one (100).
# presumably all are measured in environment timesteps — confirm
test_interval: 500
log_interval: 500
runner_log_interval: 100
learner_log_interval: 100
# presumably the total training budget in timesteps — confirm
t_max: 2005000

# Model size and observation switches.
# NOTE(review): semantics are defined by the consumer, not by this file; the
# descriptions below are assumptions to confirm.

# presumably the width of the agent network's hidden layer — confirm
hidden_dim: 4
# presumably appends the agent's identity to its observation — confirm
obs_agent_id: True
# presumably controls whether the previous action is added to the
# observation (disabled here) — confirm
obs_last_action: False

# NOTE(review): purpose not determinable from this file; check where the
# consumer reads `random_output` before changing it.
random_output: True