# --- MADDPG NS specific parameters ---

# Runner selection and the batch size it runs with.
runner: 'episode'
batch_size_run: 1

# Size of the buffer (units are not shown in this file).
buffer_size: 50000
# Target-network update setting. The key name allows either an update
# interval or a tau value; the fractional 0.01 used here presumably acts as a
# soft-update coefficient rather than an episode count -- TODO confirm
# against the learner that reads it.
target_update_interval_or_tau: 0.01

# Observation options. The two commented-out keys are not set by this file.
obs_agent_id: false
# obs_last_action: False
# obs_individual_obs: False


# Component selection: training uses the maddpg_learner together with the
# agent, controller (mac) and critic named below.
learner: 'maddpg_learner'
agent: 'rnn_ns'
mac: 'maddpg_mac'
critic_type: 'maddpg_critic_ns'
agent_output_type: 'pi_logits'

# Numeric hyperparameters.
lr: 0.0005
reg: 0.001
batch_size: 16
hidden_dim: 128

# Standardisation switches: rewards are standardised, returns are not.
standardise_rewards: true
standardise_returns: false
# use_rnn: False

# Name of this configuration.
name: 'maddpg_ns'
# On-policy flag; disabled for this configuration.
on_policy: false
