# Hydra defaults list. Entries are merged in order, so later entries override
# earlier ones; do not reorder without checking the composed config.
defaults:
  # This file's own values come first, so the group configs selected below
  # take precedence over them on conflicting keys.
  - _self_
  - algo: ddpg
  - task: Ant-v3
  # Chosen from the algo/task selections above (hyperparams/<algo>/<task>).
  - hyperparams: ${algo}/${task}
  # NOTE(review): the colorlog and joblib options are presumably provided by
  # the hydra-colorlog and hydra-joblib-launcher plugins -- confirm they are
  # installed wherever this config is used.
  - override hydra/job_logging: colorlog
  - override hydra/hydra_logging: colorlog
  - override hydra/launcher: joblib

# Seeding and device selection.
seed: 1
torch_deterministic: true
use_gpu: true
auto_gpu: true
# NOTE: `device` is the setting to use when experiments are not spread across
# multiple GPUs.
# NOTE(review): how it interacts with use_gpu/auto_gpu above is decided by the
# consuming code, which is not visible here -- confirm.
device: cpu

# Underscore digit grouping is YAML 1.1 integer syntax; PyYAML-based loaders
# read this value as 1500000.
total_timesteps: 1_500_000

# Timestamp from Hydra's `now` resolver (strftime format); reused in run_dir
# and wandb.name.
ts: ${now:%y-%m-%d_%H-%M-%S}

# Settings for the "dris" component.
# NOTE(review): the meaning of the individual fields is defined by the code
# that reads them, which is not visible in this file.
dris:
  enable: true
  # Written with an explicit mantissa and exponent sign so that plain YAML 1.1
  # loaders also parse it as a float rather than a string.
  t: 1.0e+8
  actor_strategy: 'none'
  # `ln` is not an OmegaConf/Hydra built-in resolver; the application must
  # register it before this value is resolved.
  # NOTE(review): presumably the natural log of 2 -- confirm.
  clip: ${ln:2}
  auto_tune: true
  clip_r_th: 0.01
  t_mul: 1.01
  update_freq: 8
  is_flip: false
  # Relative interpolation: follows the top-level `verbose` flag.
  verbose: ${..verbose}

# Weights & Biases settings.
wandb:
  launch: true
  project: mujoco_paper
  # Run name built from the `name` field of the selected algo and task configs
  # plus the `ts` timestamp; both configs must therefore define `name`.
  name: ${algo.name}_${task.name}_${ts}
  entity: project

# Output locations and run-level switches.
mode: debug
# Per-run directory: ./runs/<mode>/<ts>/<algo.name>/<task.name>.
run_dir: ./runs/${mode}/${ts}/${algo.name}/${task.name}
capture_video: false
# Checkpoints are kept in a subdirectory of the run directory.
checkpoint_dir: ${run_dir}/checkpoints
total_eval_cnt: 200
# Also feeds dris.verbose through interpolation.
verbose: true  # turn to false to stop tracking and logging extra metrics

# Each entry names a top-level key or config group of this file.
# NOTE(review): presumably the keys compared when matching this run against
# earlier ones (possibly related to `rerun`) -- confirm against the code that
# reads check_keys.
check_keys:
  - dris
  - algo
  - task
  - hyperparams
  - seed
  - total_timesteps
  - mode

# Hydra runtime settings.
hydra:
  # Single runs write straight into the per-run directory.
  run:
    dir: ${run_dir}

  # Multirun: each job writes to <run_dir>/<override_dirname>/seed=<seed>.
  sweep:
    dir: ${run_dir}
    subdir: ${hydra.job.override_dirname}/seed=${seed}

  job:
    # Environment variables set for the job.
    env_set:
      HYDRA_FULL_ERROR: "1"
      WANDB_START_METHOD: "thread"
    config:
      override_dirname:
        # Left out of override_dirname: seed is appended separately in
        # sweep.subdir, and run_dir already contains the algo and task names.
        exclude_keys:
          - seed
          - algo
          - task

  launcher:
    # Option of the launcher selected in the defaults list (joblib).
    n_jobs: 24

# Directory the application was launched from, as reported by Hydra
# (hydra.runtime.cwd).
work_dir: ${hydra:runtime.cwd}
# NOTE(review): semantics are defined by the consuming code -- confirm.
rerun: false