# Hydra defaults list. `_self_` marks where this file's own values sit in the
# composition order; no other config groups are listed here.
defaults:
  - _self_

# Environment / scenario settings.
model_name: ddgi
adv_num: 0
agent_num: 2
traj_length: 25
action_dim: 50
# NOTE(review): presumably one state dimension per entry of player_list, in
# the same order (both lists have agent_num = 2 entries) -- confirm.
state_dim_list: [21, 21]
player_list: [agent_0, agent_1]
# Selected player; the listed options are the entries of player_list.
player_type: agent_0 # [agent_0, agent_1]
# NOTE(review): looks like the position of player_type inside player_list;
# change both together when switching players -- confirm against the consumer.
player_type_idx: 0 # [   0,    1]

# Environment name and compute device.
# NOTE: eval.matd3_path and eval.gif_path further down hard-code the same
# `reference` name in their paths; update them together with env_name.
env_name: reference
# NOTE(review): presumably a PyTorch-style device string (first CUDA GPU) --
# confirm against the code that consumes it.
device: cuda:0

# Policy checkpoint selection.
# policy_path currently has the same value as train.weight_save_path.
policy_path: ./model/_weight
# Candidate values listed for strength: 50, 100, 250, 500.
strength: 500
# Candidate values listed for seed: 0, 10, 50.
seed: 0
use_ddgi: false

# Training settings.
train:
  batch_size: 256
  weight_save_path: ./model/_weight
  plot_save_path: ./model/_result
  data_path: ./data

  # Logging.
  # NOTE(review): presumably "log every N epochs" -- confirm.
  step_epoch_log: 10
  logs_path: ./model/_logs
  logs_message: ""

  # Optimisation.
  policy_total_epochs: 600
  # Exponent literals are written with an explicit decimal point (1.0e-4, not
  # 1e-4): YAML 1.1 loaders such as PyYAML only resolve exponent notation to a
  # float when a "." is present and would otherwise return the string "1e-4".
  weight_decay: 1.0e-4
  lr: 3.0e-4
  use_ema: true
  ema_rate: 0.995

  # Checkpointing.
  # NOTE(review): presumably "save weights every N epochs" -- confirm.
  step_save_weight: 5

# Evaluation settings.
eval:
  # Key casing (IsAgent) is intentionally left unchanged: renaming it would
  # break any code that reads this key.
  IsAgent: true
  episodes: 100
  rounds: 3

  # Paths.
  # Other checkpoint steps listed for matd3_path: 15000, 5000.
  matd3_path: ./env/reference/weight/30000.pt
  gif_path: ./evaluation/videos/reference/
  result_path: ./evaluation/result
  data_path: ./evaluation/data

# Model / sampler hyperparameters.
model:
  sample_steps: 15
  temperature: 1.0
  # NOTE(review): noise_schedule and beta_schedule hold the same value; this
  # file does not show whether both are read -- confirm before changing one.
  noise_schedule: cosine
  beta_schedule: cosine

  # network params
  latent_dim: 32
  hidden_dim: 256
  cond_dim: 128
  timestep_emb_type: positional
  alpha: 0.1
  gamma: 0.9
  # NOTE(review): x_max / x_min look like symmetric value bounds -- confirm
  # what quantity they apply to.
  x_max: 3.0
  x_min: -3.0

  # The trailing comments below list other candidate values for each key.
  d_weight: 1.0 # 2.0, 4.0, 8.0, 16.0
  sample_alpha: 0.75 # 0.0, 0.25, 0.5, 0.75, 0.9, 1.0

# Hydra runtime settings.
hydra:
  run:
    # Use the current directory as the run directory.
    dir: .
  # null disables creation of Hydra's per-run config sub-directory.
  output_subdir: null
