defaults:
  - _self_
  - model: default

use_origin_img: True

textEmbeded:
  lang_pdrop: 0.0

env: 
  num_actions: 7
  control: 'ee' # 'ee'
  # num_states: 10
  bins: 50
  client: localhost:30007
  mode: 'grasping'
  max_steps: 50
#   test:
#     _target_: ${..train._target_}
#     id: ${..train.id}
#     size: ${..train.size}
#     max_episode_steps: 108000
#     noop_max: 1
#     frame_skip: ${..train.frame_skip}
#     done_on_life_loss: False
#     clip_reward: False

datasets:
  num_worker: 8
  batch_size: 16
  sample_frame: 8
  history_len: 1
  train:
    _target_: feeders.Feeder
    control: ${env.control}
    data_path:
      - ???

    instructions_path: ???
    history_len: ${datasets.history_len}
    instructions_level: 
      # - 0
      - 1
      - 2
      - 3
      - 4
    sample_frame: ${datasets.sample_frame}
    bin: 50
    img_size: 224
    data_size: null
    dataAug: True
  test:
    _target_: feeders.Feeder
    control: ${env.control}
    data_path:
      - ???
    instructions_path: ???
    history_len: ${datasets.history_len}

    instructions_level: 
      # - 0
      - 1
      - 2
      - 3
      - 4
    sample_frame: ${datasets.sample_frame}
    bin: 50
    img_size: 224
    data_size: 100
    dataAug: False
  eval:
    instr_path: ???
    history_len: ${datasets.history_len}
    levels: 
      # - 0
      # - 1
      # - 2
      # - 3
      - 4
    data_path:
      - ???
    control: ${env.control}

wandb:
  mode: online
  project: KeyWorld
  entity: null
  name: null
  group: null
  tags: null
  notes: null

common:
  epochs: 200
  device: cuda:0
  do_checkpoint: True
  seed: 0
  sequence_length: 1 # ${world_model.max_blocks}
  resume: False # set by resume.sh script only.

initialization:
  path_to_checkpoint: 
  load_tokenizer: False
  load_world_model: True 
  load_actor: True

training:
  should: True

  agent:
    batch_num_samples: 64
    grad_acc_steps: 1
    max_grad_norm: 10.0
    weight_decay: 0.001 #0.00001 # 0.01
    start_after_epochs: 0
    learning_rate: 0.0001 # 0.00001
    lr_scheduler_func: CosineAnnealingLR # StepLR CosineAnnealingLR
    lr_scheduler_config: 
      T_max: 10
      eta_min: 0.0000005 # 0.000001 # 0.0000005
      # step_size: 20
    loss_weight:
      - 1
      - 1

evaluation:
  should: True
  every: 1
  agent:
    batch_num_samples: 64
    grad_acc_steps: 1
    max_grad_norm: 10.0
    start_after_epochs: 0
