# Environment section: task name, episode step limits, language/dataset
# inputs and camera parameters.
environment:
  RENDER: false
  VENV_SEED: 42
  ENV_NAME: Sweep-v0
  ACTION_DIM: 4
  # Original note read "5Hz, 5s".
  # NOTE(review): 5 Hz x 5 s would be 25 steps, not 40 - confirm which of
  # the rate, the duration or the step count is the current one.
  MAX_TRAIN_STEPS: 40
  MAX_EVAL_STEPS: 40
  USE_APPEND: true
  USE_LANG: true
  NUM_LANG_PER_ENV: 800
  # Same value as arch.LANG_DIM; presumably the two must agree - verify.
  LANG_DIM: 768
  # Pickle files for the train split, the test split and the language data.
  DATASET: data/tool_sweep_train.pkl
  DATASET_TEST: data/tool_sweep_test.pkl
  DATASET_LANG: data/tool_lang.pkl
  CAMERA:
    # Three-component vectors kept in flow style as short leaf values.
    pos: [0.9, 0.2, 0.25]
    euler: [0, -2.0, 0]
    img_w: 128
    img_h: 128
    aspect: 1
    fov: 60
    wrist_offset: [0.05, 0.0, 0.02]
  SUCCESS_THRESHOLD: 0.9

# Training section: devices, output location, replay memory, adaptation /
# meta-update schedule, evaluation cadence and optimiser hyper-parameters.
training:
  DEVICE: 'cuda:0'
  IMAGE_DEVICE: cpu
  NUM_CPUS: 20
  CPU_OFFSET: 0
  SEED: 42
  NAME: sweep_sac_reptile_lang
  OUT_FOLDER: result/sweep_sac_reptile_lang/0
  AGENT_NAME: AgentSACReptile
  SAVE_TOP_K: 20
  SAVE_METRIC: cum_reward
  # Explicit null (previously a bare empty value, which also parses as null).
  CURRENT_STEP: null
  MEMORY_CAPACITY: 30000
  FILL: 500
  ADAPT_ONLINE_WEIGHT: 0.7
  NUM_T: 2
  # Iteration and adaptation counts.
  NUM_ITR: 1000
  NUM_ADAPT_TASK: 1
  NUM_ADAPT_STEP: 5
  NUM_ADAPT_EPISODE: 20
  NUM_ADAPT_UPDATE: 100
  NUM_STATE_STACK: 0
  NUM_ACTION_STACK: 0
  META_UPDATE_PERIOD: 1
  # Periodic check / evaluation settings.
  CHECK_OPT_FREQ: 50
  NUM_EVAL_TASK: 9
  NUM_EVAL_EPISODE: 1
  # Update hyper-parameters.
  EVAL: false
  BATCH_SIZE: 128
  UPDATE_PERIOD: 1
  ALPHA: 0.01
  LEARN_ALPHA: false
  GAMMA: 0.99
  GAMMA_SCHEDULE: false
  # Base learning rates (A / Al / C).
  LR_A: 0.0003
  LR_Al: 0.0003
  LR_C: 0.0003
  # Meta learning rates. The middle key must be LR_Al_META: a second plain
  # `LR_Al` here would be a duplicate key, and most YAML loaders would then
  # silently keep only the last value (0.001) for LR_Al.
  # NOTE(review): confirm the agent reads `LR_Al_META`.
  LR_A_META: 0.001
  LR_Al_META: 0.001
  LR_C_META: 0.001
  LR_A_SCHEDULE: false
  LR_Al_SCHEDULE: false
  LR_C_SCHEDULE: false
  TAU: 0.01
  TARGET_ENTROPY: -3

# Architecture section: optional checkpoint paths, observation/language
# input sizes, convolution and MLP layer specs, and feature toggles.
arch:
  # No actor / critic path is configured; both values are null.
  ACTOR_PATH: null
  CRITIC_PATH: null
  OBS_CHANNEL: 3
  LANG: true
  LANG_DIM: 768
  # Four parallel three-entry lists; presumably one entry per convolution
  # layer - verify against the network constructor.
  KERNEL_SIZE: [7, 5, 3]
  STRIDE: [4, 3, 2]
  PADDING: [0, 0, 0]
  N_CHANNEL: [4, 8, 16]
  ACTIVATION:
    actor: ReLU
    critic: ReLU
  MLP_DIM:
    actor: [128, 128]
    critic: [128, 128]
  APPEND_DIM:
    actor: 0
    critic: 0
  # Boolean feature switches.
  USE_BN: false
  USE_LN: true
  USE_SM: false
  TIE_CONV: true
  USE_FILM: false
  DUAL_CONV: true
