# Hydra defaults list: the entries below are composed in the order written.
defaults:
  - configs/dreamer
  - agent: dreamer
  # Option is chosen through the `configs` interpolation; that key is not set
  # in the visible part of this file — presumably it comes from
  # configs/dreamer or a command-line override (TODO confirm).
  - configs: ${configs}
  # Swap Hydra's launcher for the submitit_local one (configured under
  # hydra.launcher).
  - override hydra/launcher: submitit_local

# ---- mode ----
reward_free: true

# ---- task settings ----
# The literal string "none" (quoted to make clear it is not a YAML null).
task: 'none'
# primal task will be inferred at runtime
domain: walker

# ---- train settings ----
# Note: 10 frames past the last entry of `snapshots` (2000000).
num_train_frames: 2000010
num_seed_frames: 4000

# ---- eval ----
eval_every_frames: 10000
num_eval_episodes: 10

# ---- snapshot ----
snapshots: [100000, 500000, 1000000, 2000000]
# `obs_type` and `agent.name` are not defined in this file; presumably they
# are provided by the composed defaults (TODO confirm).
snapshot_dir: '../../../pretrained_models/${obs_type}/${domain}/${agent.name}/${separate_wm}_${seed}'

# ---- replay buffer ----
replay_buffer_size: 1000000
replay_buffer_num_workers: 4

# ---- misc ----
seed: 1
device: cuda
save_video: false
save_train_video: true
use_tb: true
use_wandb: true

# ---- separate ----
disen_scales:
  discount: 2000.0
  disen_only: 1.5
  kl_disen: 1.0
  proprio: 1.0
  reward: 20000.0
separate_wm: false
disen_disagreement: false

# ---- experiment ----
# `experiment` is also used as the suffix of the Hydra sweep directory name.
experiment: pt
project_name: exp

# ---- log settings ----
log_every_frames: 1000
recon_every_frames: 20000


# Hydra runtime settings: output directories for single runs and sweeps, plus
# the resource request passed to the submitit launcher.
hydra:
  run:
    # Single-run output directory; the time stamp has second resolution.
    dir: ./exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${agent.name}_se_${separate_wm}_${domain}_${seed}
  sweep:
    # Multirun root directory; the time stamp has minute resolution and the
    # name additionally carries the `experiment` tag.
    dir: ./exp_sweep/${now:%Y.%m.%d}/${now:%H%M}_${agent.name}_se_${separate_wm}_${domain}_${seed}_${experiment}
    # One sub-directory per job, named by the job number.
    subdir: ${hydra.job.num}
  launcher:
    timeout_min: 4300
    cpus_per_task: 10
    gpus_per_node: 1
    tasks_per_node: 1
    mem_gb: 160
    nodes: 1
    # Derived from the sweep directory instead of repeating its full template,
    # so the two paths cannot drift apart when the sweep dir is edited or
    # overridden. Resolves to the same location as before by default.
    submitit_folder: ${hydra.sweep.dir}/.slurm
