# Hydra defaults list. `_self_` marks where this file's own values are merged
# relative to other entries in the list; it is the only entry here, so no
# other config is composed in from this list.
defaults:
  - _self_

# Environment / player setup
model_name: dd
adv_num: 1
agent_num: 1
# NOTE(review): 42 and 7 match a 6x7 connect4 board (cells / columns) --
# presumably tied to env_name; confirm before changing either.
traj_length: 42
action_dim: 7
# Identifiers of the available players.
player_list:
  - agent_0
  - agent_1
# Selected player; one of the player_list entries (agent_0 or agent_1).
player_type: agent_0
# Index of player_type within player_list (agent_0 -> 0, agent_1 -> 1).
# NOTE(review): presumably has to be kept in sync with player_type by hand.
player_type_idx: 0

# Runtime: environment name, compute device, and random seed
env_name: connect4
# NOTE(review): looks like a torch-style device string -- confirm what the
# consumer accepts (e.g. whether "cpu" is a valid fallback).
device: cuda:0
seed: 0

# Paths (relative; resolved against the working directory)
data_path: ./data
emb_path: ./model/_weight
# NOTE(review): `strength` is not a path and its meaning is not visible in
# this file -- confirm what it controls and consider moving it to the
# stanza it belongs to.
strength: 250

# Training
diffusion_gradient_steps: 10000
invdyn_gradient_steps: 5000
sample_steps: 25
batch_size: 256
# Written with an explicit mantissa dot on purpose: YAML 1.1 loaders such as
# PyYAML read a bare `5e-4` as the string "5e-4" rather than a float.
lr: 5.0e-4
predict_noise: true
next_obs_loss_weight: 10.0
ema_rate: 0.9999
temperature: 1.0
log_interval: 100
save_interval: 100

# Model
model:
  # diffusion schedules and sampler
  noise_schedule: cosine
  beta_schedule: cosine
  solver: ddim

  # network / sequence dimensions
  emb_dim: 128
  # NOTE(review): same value as top-level traj_length (42); presumably the
  # two must stay equal -- confirm.
  horizon: 42
  latent_dim: 64
  hidden_dim: 256

# Inference / evaluation
eval:
  # One of: true, false
  IsAgent: true
  episodes: 100
  rounds: 10
  # One of: "random", "weak", "strong", "dqn"
  opponent: dqn

  # Input weights and output locations used during evaluation
  dqn_path: ./env/connect4/weight/lesson4_agent.pt
  gif_path: ./evaluation/videos/connect4/
  result_path: ./evaluation/result

# Hydra runtime settings
hydra:
  run:
    # Use the current directory as the run directory.
    dir: .
  # Per Hydra's documentation, null disables the `.hydra` config-dump
  # subdirectory -- confirm against the installed Hydra version.
  output_subdir: null
