VERSION: GATv2_EnvGlobalNode_Emb_ILRL
runner: 'VGMRunner'
scene_data: 'gibson'
BASE_TASK_CONFIG_PATH: "configs/vistargetnav_gibson.yaml"
IL_TRAINER_NAME: "BC_trainer"
RL_TRAINER_NAME: "PPOTrainer_Memory_aux"
ENV_NAME: "SearchEnv"

SIMULATOR_GPU_ID: 1
TORCH_GPU_ID: 1

NUM_PROCESSES: 4
NUM_VAL_PROCESSES: 0

SENSORS: ["DEPTH_SENSOR", "RGB_SENSOR"]

LOG_INTERVAL: 100
CHECKPOINT_INTERVAL: 200
VIS_INTERVAL: 200

OBS_TO_SAVE: ['global_memory', 'global_mask', 'global_A', 'global_time',
              'panoramic_rgb', 'panoramic_depth','goal_embedding', 'episode_info', 'target_goal',
              'step', 'have_been', 'target_dist_score']
POLICY: 'VGMPolicy'
WRAPPER: 'GraphWrapper'

GCN:
  TYPE: "GATv2"
  ENV_GLOBAL_NODE_MODE: "embedding"
  RANDOMINIT_ENV_GLOBAL_NODE: False
  RANDOM_REPLACE: False # default to False
  ENV_GLOBAL_NODE_LINK_RANGE: -1.0 # 0.2, 0.5, 0.8 # default to -1.0

memory:
  FORGET: False
  TRAINING_FORGET: False
  FORGETTING_TYPE: "simple"
  FORGETTING_ATTN: "goal" # "goal", "cur", "global_node" # default to "goal"
  RANK: "bottom" # "top", "bottom"
  RANK_THRESHOLD: 0.2
  TOLERANCE: 1
  RANDOM_SELECT: False # Default to False

transformer:
  DECODE_GLOBAL_NODE: True  # Default to True


REWARD_METHOD: 'progress'
USE_AUXILIARY_INFO: True

BC:
  max_epoch: 100 # defalt to 100
  batch_size: 16
  num_workers: 8

RL:
  SUCCESS_REWARD: 10.0
  SUCESS_MEASURE: 'SUCCESS'
  SLACK_REWARD: -0.001
  PPO:
    num_mini_batch: 2
    num_steps: 256
    rl_pretrained: False
    il_pretrained: True
    pretrained_weights: "data/new_checkpoints/GATv2_EnvGlobalNode_Emb_ILRL_IL/epoch0023iter20000.pt"
