# Hydra defaults list. `_self_` is the only entry, so no other config files
# are composed in from here; it marks this file's own place in the
# composition order.
defaults:
  - _self_

# Environment / player layout
model_name: idql
# Player counts; they match the names in player_list below
# (three adversary_* entries, one agent_* entry).
adv_num: 3
agent_num: 1
# NOTE(review): presumably the number of steps per trajectory - confirm.
traj_length: 25
action_dim: 5
act_steps: 1
# Observation window: previous + current step.
obs_steps: 2
# Four entries, the same length as player_list.
# NOTE(review): presumably one state dimension per player, in player_list
# order - confirm against the code that reads it.
state_dim_list: [16, 16, 16, 14]
player_list: [adversary_0, adversary_1, adversary_2, agent_0]
# Selected player; allowed values are the names in player_list.
player_type: agent_0
# Index of player_type within player_list:
#   adversary_0 = 0, adversary_1 = 1, adversary_2 = 2, agent_0 = 3.
# Nothing in this file derives it, so keep it in sync with player_type by hand.
player_type_idx: 3
discount: 0.99

# Runtime: environment name, compute device, random seed
env_name: tag
# Plain string (the colon is not followed by a space, so this is not a mapping).
# NOTE(review): looks like a torch-style device string - confirm.
device: cuda:0
seed: 0

# Paths (written relative to `.`)
data_path: ./data
emb_path: ./model/_weight
# NOTE(review): `strength` is not a path, and what consumes it is not visible
# in this file - confirm its meaning and whether it belongs in this section.
strength: 500


# IQL
# NOTE(review): presumably the expectile used by the IQL value loss - confirm.
iql_tau: 0.9

# Actor (diffusion settings)
solver: ddpm
# Both step counts are currently set to the same value.
diffusion_steps: 10
sampling_steps: 10
# Canonical lowercase boolean; parses to the same value as `True`.
predict_noise: true
ema_rate: 0.9999
actor_learning_rate: 0.0003
actor_hidden_dim: 256
actor_n_blocks: 3
actor_dropout: 0.1
# NOTE(review): two separate temperature settings; which code path reads each
# one is not visible in this file - confirm before tuning.
temperature: 0.5
weight_temperature: 5

# Critic
# Same width and learning rate as the actor settings
# (actor_hidden_dim: 256, actor_learning_rate: 0.0003).
critic_hidden_dim: 256
critic_learning_rate: 0.0003

# Training
gradient_steps: 2000
batch_size: 256
# Logging and checkpoint-saving intervals are both 100.
# NOTE(review): presumably counted in gradient steps - confirm.
log_interval: 100
save_interval: 100

# Model
model:
  # NOTE(review): two schedule keys carrying the same value; confirm whether
  # both are read or one is a leftover.
  noise_schedule: cosine
  beta_schedule: cosine

  # Network parameters
  latent_dim: 32
  hidden_dim: 256
  # Symmetric bounds: [-3.0, 3.0].
  # NOTE(review): presumably a clipping range for x - confirm.
  x_max: 3.0
  x_min: -3.0


# Inference / evaluation
eval:
  # Boolean flag; allowed values: true, false.
  IsAgent: true
  episodes: 50
  rounds: 3

  # Input weights and output locations.
  matd3_path: ./env/tag/weight/5000_4p.pt
  gif_path: ./evaluation/videos/tag/
  result_path: ./evaluation/result


# Hydra runtime settings
hydra:
  run:
    # Use the current directory as Hydra's run directory.
    dir: .
  # null turns off Hydra's per-run config output subdirectory
  # (see the Hydra documentation for `hydra.output_subdir`).
  output_subdir: null
