# --- Dataset / Loader ---
dataset:
  root_dir_train: "../datasets_smpl"
  root_dir_val: "../datasets_smpl"
  train_split: "training_many_skills"
  val_split: "bridge_many_skills_exp"
  batch_size: 32 
  traj_len: 120
  img_size: 224
  shuffle: true
  num_workers: 0
  normalize: true
  pin_memory: false

dataset_eval:
  root_dir: "../datasets_smpl"
  splits:
    - "bridge_many_skills_exp"
    - "tabletop_dark_wood_fold_cloth_pnp_200"
    - "minsky_folding_table_white_tray_sweep_granular_100"
    - "laundry_machine_pnp_sweep_200"
    - "folding_table_fold_cloth_pnp_200"
    - "robot_desk_fold_cloth_200"
    - "deepthought_toykitchen1_many_skills_200"
    - "deepthought_toykitchen2_stack_blocks_200"
    - "deepthought_folding_table_stack_blocks_200"
    - "deepthought_robot_desk_drawer_pnp_200"
    - "script_pnp_objects_200"
    - "script_pnp_rigid_objects_200"
    - "script_pnp_soft_toys_200"
    - "script_pnp_utensils_200"
    - "script_sweep_pnp_200"
  img_size: 224
  num_workers: 4
  normalize: true
  stride: 8

# --- Model Architecture ---
model:
  clip_model: "ViT-B-32"
  pretrained_clip: "openai"
  f_adapt_depth: 1 # Number of residual layers in f_adapt 
  activation: "gelu" # Activation function in f_adapt (gelu/relu)
  projection_dim: [64] # d' in P_K, P_V, P_Q

# --- Training ---
training:
  num_epochs: 5  
  base_lr: 1e-4 # Learning rate for training the full model
  optimizer: "adamw"
  weight_decay: 1e-4
  lambda_self: [0.5]  # Weight for self-supervised loss
  seed: 17
  ttt_lr_eval: 5e-2
  window_size: 8
  ttt_epochs_eval: 5
  cosine_warmup_pct: 0.1
  num_runs: 1
  ignore_window: False
  desc: "train_reproduce"
  gpu: 2
  random_w_size: 8
  num_windows: 8
  temporal_perturb_rate: 0.0
  grad_clip: 1.0 
  batch_sampling: "dissimilarity" #ft, random, mini_batch
  checkpoint:
    dir: "../checkpoints"
    steps: 5  # Save every 5 epochs

# --- Test-Time Training ---
evaluation:
  ttt_lr: [0.1] # Learning rate for updating f_adapt during 
  ttt_epochs: [1] #[1,5,10] # Number of adaptation steps in offline TTT
  ttt_online: false # Whether to run online TTT (True) or offline (False)
  model_dirs: 
    - "path_to_model_dir"
  projection_dims: [64] # d' in P_K, P_V, P_Q
  window_size: [8] #[2,8,16]
  reset: True
  perturbation_rate: 0.5
  shuffling_online: False
  desc: "eval_reproduce"
  gpu: 3
  seed: 17