# Identifiers for the two sides of this experiment.
# NOTE(review): presumably algorithm names resolved by the training code; the
# set of valid values is not visible in this file -- confirm against the loader.
attacker: "hyar"
defender: "qmix"

# Runner selection and rollout/replay sizing.
runner: "ad_parallel"
# NOTE(review): presumably the number of environments stepped in parallel by
# the runner -- confirm.
batch_size_run: 12 

# NOTE(review): replay buffer capacity; the unit (episodes vs. transitions) is
# not stated in this file -- confirm.
buffer_size: 5000

# Update the target network once every `target_update_interval` episodes.
target_update_interval: 200

# Training horizon and phase boundaries.
# As configured, t_max equals attacker_stop + 1,000,000, and defender_start
# is 1,000,000.
# NOTE(review): units are presumably environment timesteps, and the names
# suggest the attacker stops training at attacker_stop while the defender
# begins at defender_start -- confirm against the training loop.
t_max: 21100000 
attacker_stop: 20100000 
defender_start: 1000000 

# Checkpoint loading and experiment logging.
# Empty string: no checkpoint path is configured here.
checkpoint_path: ''

# NOTE(review): presumably selects which saved step to load from
# checkpoint_path; the meaning of 0 is not visible in this file -- confirm.
load_step: 0
# Logging backends: TensorBoard is disabled, Weights & Biases is enabled.
use_tensorboard: False
use_wandb: True 

# Attacker/defender training schedule.
# As configured, attacker_train is 5x switch_interval and defender_train
# equals switch_interval.
# NOTE(review): the semantics below are inferred from the key names only
# (alternating training phases, with the attacker re-initialised between
# phases when reinit_attacker is True) -- confirm against the training loop.
concurrent_train: True
switch_interval: 200000 
attacker_train: 1000000 
defender_train: 200000 
reinit_attacker: True

# Attacker action-space sizes, reward scaling and perturbation bound.
# NOTE(review): presumably the sizes of the discrete and continuous-parameter
# parts of a hybrid attacker action -- confirm against the attacker model.
discrete_action_dim: 8 
parameter_action_dim: 64 
# Negative scale factor. NOTE(review): presumably applied to the defender's
# reward to form the attacker's reward (sign flip) -- confirm.
ad_policy_reward_scale: -100.0
add_history_attacker: True
# NOTE(review): presumably the maximum perturbation magnitude; units and the
# quantity being perturbed are not visible in this file -- confirm.
perturbation_range: 10.0

# Update repetition counts and attacker-population settings.
# As configured, the attacker repeat count is twice the defender's.
# NOTE(review): presumably the number of gradient updates per training
# call -- confirm.
attacker_update_repeat: 6
defender_update_repeat: 3
# NOTE(review): presumably the size of the attacker population, with
# reproduction_ratio the fraction replaced/reproduced per generation and
# distance_threshold a diversity cutoff -- all inferred from names; confirm.
n_attackers: 20 
reproduction_ratio: 0.25 
distance_threshold: 0.25
# Parameters for the trajectory encoder and decoder.
# NOTE(review): enc_heads (3) does not evenly divide enc_emb (16). Attention
# implementations that split the embedding across heads require divisibility;
# confirm how the encoder selected below uses these two values.
enc_emb: 16
enc_heads: 3
enc_depth: 16
dec_emb: 16
# NOTE(review): presumably toggle whether attacker/defender actions are part
# of the encoded trajectory -- confirm.
traj_attacker_action: False
traj_defender_action: False
# Encoder/decoder implementations, selected by name.
traj_encoder: "transformer_encoder"
traj_decoder: "rnn_decoder"

# --- Defense-module-specific parameters ---
# NOTE(review): presumably indicates whether a pre-trained defender is
# loaded -- confirm.
defense_loaded: False

# NOTE(review): presumably restricts the attack to the agent at index 0 when
# True -- confirm.
attack_agent_0: False

# Name of this configuration.
name: "ad"