# Hydra defaults list: composes this config with the `env_config.yaml` option
# of the `env` group and the `multi_diayn` option of the `agent` group.
# Values under `agent` are referenced below via ${agent.*} interpolations.
defaults:
  - env: env_config.yaml
  - agent: multi_diayn

# mode
reward_free: true
# Observation type; one of [states, pixels].
obs_type: states
# Number of stacked frames; only takes effect when obs_type=pixels.
frame_stack: 3
# Set to 2 when obs_type=pixels.
action_repeat: 1
# NOTE(review): the author marked this value as uncertain ("???");
# the candidate values listed were 0.95 and 0.99.
discount: 0.99
# train settings
num_train_frames: 4000010
# The replay buffer samples from episodes, so a large number of seed frames
# is important.
num_seed_frames: 24000
# eval
eval_every_frames: 100000
# Alternative values noted by the author: 10, 0.
num_eval_episodes: 10
# replay buffer
replay_buffer_size: 1000000
replay_buffer_num_workers: 4
# batch_size and nstep are interpolated from the selected agent config.
batch_size: ${agent.batch_size}
nstep: ${agent.nstep}
# Should always be true for pre-training.
update_encoder: true
# misc
seed: 1  # must be > 0
cuda_id: 0
save_video: false
save_train_video: false
# Logging backends (tb presumably means TensorBoard; wandb, Weights & Biases
# — confirm against the logger code).
use_tb: false
use_wandb: true

# NOTE(review): presumably toggles hindsight experience replay — confirm.
her: false

# n_updates and n_env should be scaled proportionally to each other:
# when changing one, change the other by the same factor.
n_updates: 2
n_env: 4

# task settings
# Domains noted by the author: toy, igibson, moma2d, particle, quadruped.
domain: quadruped

# Free-form experiment name; it is the last component of exp_group.
# Empty by default.
exp_nm: ""

# Experiment group label. The folded scalar joins the lines below with single
# spaces, giving "${domain} ${agent.name} ${exp_nm}" before interpolation.
# Further components can be appended as extra lines at the same indentation.
exp_group: >-
  ${domain}
  ${agent.name}
  ${exp_nm}
#  r_dist:${agent.return_dist}
#  Q_range:${agent.Q_range}
#  her:${her}
#  use_ext:${agent.add_task_reward}

#  schedule_anti:${agent.anti}
#  spn:${agent.use_spectral_norm}
#  sac:${agent.sac}
#  critic:${agent.critic_type}
#  simp:${env.particle.simplify_action_space}
#  temp:${agent.init_temperature}
#  anti_coef:${agent.anti_coef}
#  trans:${agent.update_skill_every_step}
#  mask:${agent.mask_out_transitions}
#  skt:${agent.update_skill_inter_episode}
#  skdim:${agent.skill_dim}
#  par:${agent.parted}
#  thres:${agent.update_skill_threshold}

#exp_group:
#  ${domain}
#  N:${env.particle.N}
#  sac:${agent.sac}
#  nc:${agent.skill_channel}
#  act:${agent.actor_type}


# Run identifier: "seed:${seed}" followed by the experiment group. The folded
# scalar joins the two lines with a single space.
experiment: >-
  seed:${seed}
  ${exp_group}

# snapshot
# NOTE(review): presumably the frame counts at which a snapshot is saved —
# confirm against the training script.
snapshots:
  - 100000
  - 500000
  - 1000000
  - 2000000
  - 3000000
  - 4000000
# Snapshot location, built from the observation type, domain, experiment
# identifier and seed.
snapshot_dir: '../../../models/${obs_type}/${domain}/${experiment}/${seed}'


# Hydra output directories, named from the launch date/time and ${experiment}.
hydra:
  run:
    dir: './exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${experiment}'
  sweep:
    # The sweep timestamp has minute resolution (no seconds), unlike run.dir.
    dir: './exp_sweep/${now:%Y.%m.%d}/${now:%H%M}_${experiment}'
    # One sub-directory per sweep job, named by the job number.
    subdir: '${hydra.job.num}'
