# Seed values 0 through 9 (ten entries).
# NOTE(review): presumably one run is performed per seed; confirm in the consumer.
seeds: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]
# --- Collection ---
collection:
  # Environment ids listed under `eval_envs`; the same ten ids appear again
  # as `env_name` values under `tasks` below, so keep the two lists in sync.
  eval_envs:
    - "reach-v3"
    - "push-v3"
    - "pick-place-v3"
    - "door-open-v3"
    - "drawer-open-v3"
    - "drawer-close-v3"
    - "button-press-topdown-v3"
    - "peg-insert-side-v3"
    - "window-open-v3"
    - "window-close-v3"

  # Defaults shared by all tasks.
  max_steps: 150
  camera_name: "corner"
  render_mode: "rgb_array"
  success_episodes: 20

  # One entry per task: the environment id and a short text description.
  tasks:
    - env_name: "reach-v3"
      desc: "Reach a goal position."
    - env_name: "push-v3"
      desc: "Push the puck to a goal."
    - env_name: "pick-place-v3"
      desc: "Pick and place a puck to a goal."
    - env_name: "door-open-v3"
      desc: "Open a door with a revolving joint."
    - env_name: "drawer-open-v3"
      desc: "Open a drawer."
    - env_name: "drawer-close-v3"
      desc: "Push and close a drawer."
    - env_name: "button-press-topdown-v3"
      desc: "Press a button from the top."
    - env_name: "peg-insert-side-v3"
      desc: "Insert a peg sideways."
    - env_name: "window-open-v3"
      desc: "Push and open a window."
    - env_name: "window-close-v3"
      desc: "Push and close a window."

# --- Evaluation dataset for reward computation ---
# Settings for loading the collected data that rewards are computed on.
dataset_eval:
  root_dir: "."      # parent containing collected splits (e.g., pick-place-v3_50)
  # NOTE(review): presumably the square image side length in pixels; confirm.
  img_size: 224
  # NOTE(review): presumably the number of data-loading worker processes; confirm.
  num_workers: 4
  # Boolean switch; which normalization it enables is not visible in this file.
  normalize: true
  # NOTE(review): unit of the stride (frames? steps?) is not stated here; confirm
  # against the dataset loader.
  stride: 8

# --- Model ---
# Model backbone, projection size, and checkpoint locations.
model:
  # Same device string as `training.iql_device` below.
  device: "cuda:2"
  # NOTE(review): name/pretrained tag look like an open_clip-style pair; confirm
  # against the code that loads the model.
  clip_model: "ViT-B-32"
  pretrained_clip: "openai"
  projection_dim: 64 # alternative value left by the author: 1024
  # Relative paths; the base directory they resolve against is not visible here.
  # The file name below contains "proj64", matching `projection_dim: 64`.
  checkpoint_path: "../checkpoints/f_vlm_adapt_epoch5_lambda0.5_proj64_rand_wsize8_nwind_8_final_64_8rws_8nw_20250514-142312.pth"
  # NOTE(review): this file name contains "proj1024" while `projection_dim` is
  # 64; confirm the fine-tuned checkpoint is loaded with a matching dimension.
  checkpoint_path_ft: "../checkpoints/vlm_adapt_epoch50_lambda0.5_proj1024_rand_wsize8_nwind_8_final_clip_ft_retrained_20250515-111130.pth"

# --- Training (IQL + eval knobs we read) ---
# IQL training budget and the evaluation settings read alongside it.
training:
  # Same device string as `model.device` above.
  iql_device: "cuda:2"
  # 100000 total steps at 10000 steps per epoch, i.e. 10 epochs if epochs are
  # derived by division (NOTE(review): confirm in the trainer).
  iql_n_steps: 100000
  iql_n_steps_per_epoch: 10000
  # Same value (20) as `collection.success_episodes`.
  eval_episodes: 20
  # Same value (150) as `collection.max_steps`.
  eval_max_steps: 150


# --- Test-Time Training (for rewards) ---
# Selects which reward methods are evaluated and the test-time-training knobs.
evaluation:
  # Reward methods to run. Method names listed by the author as options:
  # "online", "offline", "window", "clip", "clip_reg".
  reward_methods: ["clip_reg"]
  # Boolean flag, written in canonical lowercase form.
  # NOTE(review): what "expert" toggles is not visible in this file; confirm.
  expert: false
  # Test-time-training learning rate and number of epochs (per the key names).
  ttt_lr: 0.1
  ttt_epochs: 1
