# Hydra defaults list. `_self_` marks the position of this file's own values
# in the composition order (see Hydra's defaults-list documentation).
defaults:
  - _self_

# Environment settings
model_name: ddgi
adv_num: 1
agent_num: 1
traj_length: 6
action_dim: 4
state_dim_list:
  - 72
  - 72
player_list:
  - agent_0
  - agent_1
# player_type and player_type_idx are set as a pair:
#   player_type:     agent_0 | agent_1
#   player_type_idx:       0 |       1
# NOTE(review): the index presumably is the position of player_type in
# player_list; confirm against the code that reads these keys.
player_type: agent_0
player_type_idx: 0

# Environment name, device string, and seed
env_name: holdem
device: 'cuda:0'  # quoted because the value contains a colon
seed: 0  # values listed by the original author: 0, 10, 50

# Model paths
emb_path: ./model/_weight
policy_path: ./model/_weight

# Other top-level settings (not paths)
strength: 500  # values listed by the original author: 50, 100, 250, 500
use_ddgi: true

# Training settings
train:
  batch_size: 256
  weight_save_path: ./model/_weight
  plot_save_path: ./model/_result
  data_path: ./data

  # Logging
  step_epoch_log: 10
  logs_path: ./model/_logs
  logs_message: ""

  # Optimization
  policy_total_epochs: 600
  # Exponent-form floats carry an explicit decimal point: YAML 1.1 loaders
  # such as PyYAML resolve a bare `1e-4` as a string, not a float.
  weight_decay: 1.0e-4
  lr: 3.0e-4
  use_ema: true  # boolean: true or false
  ema_rate: 0.995

  # Saving
  step_save_weight: 5

# Evaluation settings
eval:
  # NOTE(review): `IsAgent` is the only PascalCase key in this file. It is
  # left unchanged because renaming it would require updating whatever
  # reads this key.
  IsAgent: true  # boolean: true or false
  episodes: 100
  rounds: 10

  # Paths
  # Values listed by the original author for the nfsp_path model number:
  # 4500, 10000, 1000
  nfsp_path: ./env/holdem/result/model_4500.pth
  gif_path: ./evaluation/videos/holdem/
  result_path: ./evaluation/result
  data_path: ./evaluation/data

# Model hyperparameters
model:
  sample_steps: 15
  temperature: 1.0
  # NOTE(review): noise_schedule and beta_schedule are both set to cosine;
  # confirm that both keys are actually read by the code.
  noise_schedule: cosine
  beta_schedule: cosine

  # Network parameters
  latent_dim: 64
  hidden_dim: 256
  cond_dim: 128
  timestep_emb_type: positional
  alpha: 0.1
  gamma: 0.9
  x_max: 3.0
  x_min: -3.0

  # Values listed by the original author for d_weight: 1, 5, 10
  d_weight: 1.0
  # Values listed by the original author for sample_alpha:
  # 0.0, 0.25, 0.5, 0.75, 0.9, 1.0
  sample_alpha: 0.5

# Hydra runtime settings
hydra:
  run:
    # Use the current directory as Hydra's run directory.
    dir: .
  # null turns off Hydra's per-run config subdirectory (`.hydra` by
  # default); see the Hydra documentation on output/working directories.
  output_subdir: null
