# Hydra defaults list: the only entry is `_self_` (this file's own keys);
# no other config groups are composed here.
defaults:
  - _self_

# Environment / model settings (top-level keys; consumer not visible here).
model_name: bc
adv_num: 1
agent_num: 1
traj_length: 6
action_dim: 4
# Two entries here and two entries in player_list below; presumably one
# state dimension per player -- TODO confirm against the consuming code.
state_dim_list: [72, 72]
player_list: [agent_0, agent_1]
# NOTE(review): the option hints on the next two lines mention adversary_0,
# which does not appear in player_list, and they place agent_0 at index 1
# while player_type_idx is 0. The hints look stale -- confirm the intended
# name/index mapping before relying on them.
player_type: agent_0 # hinted options: [adversary_0, agent_0]
player_type_idx: 0 # hinted indices: [          0,       1]

# Runtime: environment name, device, and seed.
env_name: holdem
device: cuda:0
seed: 0

# Model path.
# policy_path currently holds the same value as train.weight_save_path;
# keep the two in sync if either is changed.
policy_path: ./model/baseline/BC/_weight
strength: 500 # listed options: 50, 100, 250, 500

# Training settings.
train:
  batch_size: 256
  weight_save_path: ./model/baseline/BC/_weight
  data_path: ./data

  # Optimisation hyperparameters.
  total_epochs: 300
  # Floats carry an explicit decimal point on purpose: YAML 1.1 resolvers
  # (e.g. stock PyYAML) read a bare `1e-3` as a string, whereas `1.0e-3`
  # is resolved as a float by every loader.
  weight_decay: 1.0e-3
  lr: 1.0e-4

  # save
  # presumably the interval between weight saves; the unit (epochs vs.
  # steps) is not visible in this file -- TODO confirm
  step_save_weight: 5

# Evaluation settings.
eval:
  # Boolean written in canonical lowercase so every YAML loader resolves it
  # as a bool.
  # NOTE(review): the key is CamelCase, unlike the snake_case keys in the
  # rest of the file; it is left unchanged because it is presumably looked
  # up by this exact name elsewhere.
  IsAgent: true # [true, false]
  episodes: 100
  rounds: 10
  # Paths.
  nfsp_path: ./env/holdem/result/model_4500.pth # listed alternatives: 4500, 10000, 1000
  gif_path: ./evaluation/videos/holdem/
  result_path: ./evaluation/result

# Model hyperparameters: three integer dimensions (the code that consumes
# them is not visible in this file).
model:
  latent_dim: 32
  hidden_dim: 256
  cond_dim: 128

# Hydra runtime overrides: use the current directory as the run directory
# instead of a generated per-run output folder, and (output_subdir: null)
# do not create the per-run config subdirectory.
hydra:
  run:
    dir: .
  output_subdir: null
