# Hydra defaults list: composes this file with one task config and one agent
# config. The `@_global_` package places each group's keys at the config root.
defaults:
  # This file is merged first, so values coming from the task/agent configs
  # listed below take precedence over the settings defined in this file.
  - _self_
  - task@_global_: manipulator_bring_ball
  - agent@_global_: drm_mw
  # Replace Hydra's default launcher with submitit_local (configured under
  # `hydra.launcher` in this file).
  - override hydra/launcher: submitit_local

# Root-level experiment settings. Because `_self_` is listed first in the
# defaults list, the selected task/agent configs may override any key below.

# task settings
frame_stack: 3
action_repeat: 2  # dmc = 4, mw = 2
discount: 0.99

# train settings
num_seed_frames: 4000  # carla=400, others=4000
update_every_steps: 2

# eval
eval_every_frames: 10000
num_eval_episodes: 10

# snapshot
save_snapshot: false

# wandb
use_wandb: false

# replay buffer
replay_buffer_num_workers: 4
nstep: 3
batch_size: 256

# misc
save_video: false
save_train_video: false
use_tb: true
# experiment: exp_drq
# experiment: exp_my_05m
experiment: exp_02m
port: 22024

# agent
# Written with an explicit mantissa dot: YAML 1.1 loaders read a bare `1e-4`
# as a string, whereas `1.0e-4` is a float under every loader.
lr: 1.0e-4
feature_dim: 50
seed: 122
replay_buffer_size: 200000  # carla=100000, others=200000
device: cuda:0
PredictedDiff: true  # true=V5, false=V4
AvgStateR: true  # Avg=true
StandardAug: false  # bzaug=true, nowaug=false
int_weight: 0.05  # place=0.1, other: 0.005 (0.05), cheetah:40 (dog_stand V4:1.0, Step3:2.0, Step1:40)
pre_train_step: 0
num_train_frames: 3002000
# Hydra runtime configuration: output directories for single runs and sweeps,
# plus resource limits for the submitit launcher.
hydra:
  run:
    # Alternative output-directory layouts kept for reference:
    # dir: ./exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${hydra.job.override_dirname}_exp_bsmrint_rL2_encL2_0.02riV2_R(sa)_noVar_rap(tr)_V5_02m_125 #exp_distr+r+05ri+1stp_02m_121
    # dir: ./exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${hydra.job.override_dirname}_Tea_v5_nowaug_w${int_weight}_${seed}_alll1_clip01 #exp_distr+r+05ri+1stp_02m_121
    # dir: ./exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${hydra.job.override_dirname}_Tea_B256_V6_002_1work_lin_norm_121 #exp_distr+r+05ri+1stp_02m_121
    # dir: ./exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${hydra.job.override_dirname}_B256_ICM_${seed} #exp_distr+r+05ri+1stp_02m_121
    # Active layout (no bisim+ri): <date>/<time>_<experiment>_<seed>
    dir: ./exp_local/${now:%Y.%m.%d}/${now:%H%M%S}_${experiment}_${seed}  # exp_distr+r+05ri+1stp_02m_121
  sweep:
    # `experiment` is a root-level key of this config (same interpolation as
    # run.dir); this file defines no `agent_cfg` node to resolve against.
    dir: ./exp/${now:%Y.%m.%d}/${now:%H%M}_${experiment}
    subdir: ${hydra.job.num}
  launcher:
    timeout_min: 4300
    cpus_per_task: 10
    gpus_per_node: 1
    tasks_per_node: 1
    mem_gb: 400
    nodes: 1
    # NOTE(review): this path uses %H%M%S while sweep.dir uses %H%M, so the
    # .slurm folder is not nested under the sweep directory - confirm intended.
    submitit_folder: ./exp/${now:%Y.%m.%d}/${now:%H%M%S}_${experiment}/.slurm

# Example launch commands:
# nohup python train_dmc.py task=humanoid_stand agent=drqv2_myv3 > ./log/run_v5_step1_myv3_l1smooth1_121.log 2>&1 &
# nohup python train_mw.py task=pick-place agent=drqv2_myv3 > ./log/run_v5_step1_myv3_l1smooth1_mw_121v.log 2>&1 &
# nohup python train_dmc.py task=cheetah_run agent=drqv2_myv3 > ./log/run_myv3_seed122_nobisim+ri_dmc_clip.log 2>&1 &
# nohup python train_mw.py task=coffee-push agent=drqv2_myv3 > ./log/run_new_myv3_seed121_l1smooth01_mw_clip_s.log 2>&1 &
# nohup python train_mw.py task=pick-place agent=drm_mw > ./log/run_new_myv3_seed123_l1smooth1000_mw.log 2>&1 &
# nohup python train_mw.py task=pick-place agent=drqv2_myv3 > ./log/run_new_myv3_seed123_l1smooth1000_mw.log 2>&1 &

# Available options in 'task':
#         acrobot_swingup
#         acrobot_swingup_sparse
#         adroit_medium
#         assembly
#         basketball
#         bin-picking
#         box-close
#         carla_down04
#         cartpole_swingup_sparse
#         cheetah_run
#         coffee-button
#         coffee-pull
#         coffee-push
#         dial-turn
#         disassemble
#         dog_run
#         dog_stand
#         dog_trot
#         dog_walk
#         door
#         door-close
#         door-open
#         easy
#         finger_turn_hard
#         hammer
#         hard
#         hopper_hop
#         humanoid_run
#         humanoid_stand
#         humanoid_walk
#         manipulator_bring_ball
#         medium
#         metaworld
#         peg-insert-side
#         pen
#         pick-place
#         pick-place-wall
#         push
#         quadruped_run
#         quadruped_walk
#         reacher_easy
#         reacher_hard
#         relocate
#         soccer
#         stick-pull
#         stick-push
#         sweep-into
#         walker_run
#         walker_walk
#         window-open