# Hydra defaults list. `_self_` is the only entry, so this file composes no
# other config groups.
defaults:
  - _self_

# environment / player setup
model_name: ddgi
adv_num: 3  # matches the three adversary_* entries in player_list
agent_num: 1  # matches the single agent_* entry in player_list
traj_length: 25
action_dim: 5
# One value per player_list entry (4 values, 4 players); presumably each
# player's state dimension in player_list order - TODO confirm.
state_dim_list: [16, 16, 16, 14]
player_list:
  - adversary_0  # index 0
  - adversary_1  # index 1
  - adversary_2  # index 2
  - agent_0  # index 3
# Selected player. Keep player_type_idx equal to the position of player_type
# in player_list above.
player_type: agent_0  # one of: adversary_0, adversary_1, adversary_2, agent_0
player_type_idx: 3  # one of: 0, 1, 2, 3

# environment name and compute device
env_name: tag
device: cuda:0

# model path and run selectors
# policy_path holds the same directory as train.weight_save_path.
policy_path: ./model/_weight
strength: 500  # options: 50, 100, 250, 500
seed: 0  # options: 0, 10, 50
use_ddgi: true

# training configuration
train:
  batch_size: 256
  weight_save_path: ./model/_weight
  plot_save_path: ./model/_result
  data_path: ./data

  # logger
  step_epoch_log: 10
  logs_path: ./model/_logs
  logs_message: ""

  # optimization
  policy_total_epochs: 600
  # Floats in exponent form are written with an explicit decimal point:
  # YAML 1.1 resolvers (e.g. PyYAML) read a bare `1e-4` as the string "1e-4"
  # rather than a number, while `1.0e-4` is a float under every loader.
  weight_decay: 1.0e-4
  lr: 3.0e-4
  use_ema: true  # true or false
  ema_rate: 0.995

  # save
  step_save_weight: 5

# evaluation configuration
eval:
  # NOTE(review): CamelCase key, unlike the snake_case keys used elsewhere in
  # this file; left unchanged because consumers look it up by this name.
  IsAgent: true  # true or false
  episodes: 100
  rounds: 10

  # paths
  # Other values listed by the author for the numeric part of the file name:
  # 15000, 5000 (presumably alternative checkpoints - confirm they exist).
  matd3_path: ./env/tag/weight/30000_4p.pt
  gif_path: ./evaluation/videos/tag/
  result_path: ./evaluation/result
  data_path: ./evaluation/data

# model configuration
model:
  # sampling settings; noise_schedule and beta_schedule are both set to cosine
  sample_steps: 15
  temperature: 1.0
  weight_rate: 1.0
  noise_schedule: cosine
  beta_schedule: cosine

  # network params
  latent_dim: 32
  hidden_dim: 256
  cond_dim: 128
  timestep_emb_type: positional
  alpha: 0.1
  gamma: 0.9
  # Symmetric bounds around zero; presumably a clipping range for generated
  # values - TODO confirm against the model code.
  x_max: 3.0
  x_min: -3.0

  d_weight: 1.0
  sample_alpha: 0.75 # candidate values: 0.0, 0.25, 0.5, 0.75, 0.9, 1.0

# Hydra runtime settings: the run directory is the current directory, and
# output_subdir is null (per the Hydra docs, this disables creation of the
# `.hydra` output subdirectory).
hydra:
  run:
    dir: .
  output_subdir: null
