# @package _global_
# Root-level scalar settings.
# NOTE(review): exponent literals without a decimal point (1e-5, 1e8, ...)
# are read as floats by OmegaConf's YAML loader but as plain strings by stock
# PyYAML -- confirm which loader consumes this file before reusing it elsewhere.
learning_rate: 1e-5
lm_learning_rate: 1e-7
weight_decay: 1e-4
os_learning_rate: 1e-5
smooth_loss_scale: 1e8
smooth_gamma: 0.2
llm_update_epoch: 20
deterministic: false
# Plain string value (a checkpoint file name).
segment_model: model_100.ckpt

# Model section. Only `state_reconstruct` is set in this file; any other
# `model.*` key has to come from another config or an override.
model:
  state_reconstruct: false
  
# Environment section.
env:
  name: MiniGrid-DoorKey-8x8-v0
  # NOTE(review): YAML reads this value as the plain string "(3, 7, 7)", not
  # as a sequence, so the consumer has to parse it itself -- confirm how it is
  # consumed before rewriting it as [3, 7, 7].
  state_dim: (3, 7, 7)  # (3, 480, 640)
  action_dim: 1
  discrete: false
  eval_offline: false
  use_state: false
  eval_episode_factor: 10
  # No value is set in this file (explicit null).
  eval_env: null

# Option-selector section.
option_selector:
  commitment_weight: 5
  reset: false
  num_options: 5
  decay: 0.99

# Training dataset section.
train_dataset:
  # No value is set in this file (explicit null); it has to be supplied by
  # another config, an override, or code.
  expert_location: null
  num_trajectories: 40108
  normalize_states: false
  no_lang: false
  # Interpolation of the root-level `seed` key, which is not defined in the
  # visible part of this file.
  seed: ${seed}
  aug: true

# Validation dataset section.
val_dataset:
  # No value is set in this file (explicit null); it has to be supplied by
  # another config, an override, or code.
  expert_location: null
  # Interpolation of `trainer.num_eval_episodes` (5 in this file unless
  # overridden).
  num_trajectories: ${trainer.num_eval_episodes}
  normalize_states: false
  # Interpolation of the root-level `seed` key, which is not defined in the
  # visible part of this file.
  seed: ${seed}
  aug: true

llm_segment_image:
  # No value is set in this file (explicit null).
  save_dir: null

# Trainer section.
trainer:
  device: null  # to be filled in code
  state_il: false
  num_eval_episodes: 5
  eval_every: 5
  # NOTE(review): the `model` section visible in this file does not define
  # `K`; this interpolation only resolves if another config or an override
  # provides `model.K`.
  K: ${model.K}