defaults:
  - _self_
  - env: point_maze
  - encoder: dino 
  - action_encoder: proprio
  - proprio_encoder: proprio
  # - decoder: vqvae
  - decoder: transposed_conv
  - predictor: vit
  - override hydra/launcher: submitit_slurm

# base path to save model outputs. Checkpoints will be saved to ${ckpt_base_path}/outputs.
ckpt_base_path: ./ # put absolute path here

hydra:
  run:
    dir: ${ckpt_base_path}/outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}
  sweep:
    dir: ${ckpt_base_path}/outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}
    subdir: ${hydra.job.num}
  launcher:
    submitit_folder: ${hydra.sweep.dir}/.submitit/%j
    nodes: 1
    tasks_per_node: 1
    cpus_per_task: 8
    mem_gb: 512
    gres: "gpu:h100:1"
    timeout_min: 2880
    setup: ["export DEBUGVAR=$(scontrol show hostnames $SLURM_JOB_NODELIST)",
            export MASTER_ADDR="$(scontrol show hostnames $SLURM_JOB_NODELIST | head -n 1)",
            "export MASTER_PORT=$(for port in $(shuf -i 30000-65500 -n 20); do if [[ $(netstat -tupln 2>&1 | grep $port | wc -l) -eq 0 ]] ; then echo $port; break; fi; done;)",]

training:
  seed: 0
  epochs: 200
  batch_size: 96 # should >= nodes * tasks_per_node
  save_every_x_epoch: 10
  reconstruct_every_x_batch: 500
  num_reconstruct_samples: 6
  encoder_lr: 1e-7
  decoder_lr: 5e-4
  predictor_lr: 5e-4
  action_encoder_lr: 5e-4

img_size: 140 # should be a multiple of 224
frameskip: 4
concat_dim: 1

# # square
# train_data_path: 'path_to_train'
# val_data_path: 'path_to_val'
# view_names: ['agentview_image', 'robot0_eye_in_hand_image']

# # tool_hang
# train_data_path: 'path_to_train'
# val_data_path: 'path_to_val'
# view_names: ['sideview_image', 'robot0_eye_in_hand_image']

# transport
train_data_path: 'path_to_train'
val_data_path: 'path_to_val'
view_names: ['robot0_eye_in_hand_image', 'robot1_eye_in_hand_image', 'shouldercamera0_image', 'shouldercamera1_image']

# # pusht
# train_data_path: 'path_to_train'
# val_data_path: 'path_to_train'
# view_names: ['image']

# view_names: ['agentview']
use_resnet_encoder: True
use_layernorm: True
policy_ckpt_path: 'path_to_policy_ckpt'
action_conditioned_time_contrastive: False
contrastive_loss_type: 'contrastive'
contrastive_loss_level: 'patch'
normalize_for_contrastive: True
disable_reconstruction: False
minimize_recon_loss_pred: False
triplet_loss_margin: 0.35
use_crop: True
gradual_unfreezing: False
abs_action: True
# view_names: ['agentview']
normalize_action: True

# action encoder
action_emb_dim: 128
num_action_repeat: 1

# proprio encoder
proprio_emb_dim: 16
num_proprio_repeat: 1

num_hist: 1
num_pred: 1 # only supports 1
has_predictor: True # set this to False for only training a decoder
has_decoder: False # set this to False for only training a predictor
use_pretrained_encoder: True
encoder_ckpt_path: null
predictor_ckpt_path: null
decoder_ckpt_path: null
model:
  _target_: dino_wm.models.visual_world_model.VWorldModel
  image_size: ${img_size}
  num_hist: ${num_hist}
  num_pred: ${num_pred}
  train_encoder: False
  train_predictor: True
  train_decoder: False

debug: False 

# Planning params for planning eval jobs launched during training
plan_settings: 
  # plan_cfg_path: conf/plan.yaml # set to null for no planning evals
  plan_cfg_path: null 
  planner: ['gd', 'cem']
  goal_source: ['dset', 'random_state']
  goal_H: [5]
  alpha: [0.1, 1]