# @package _global_

# Copyright (c) 2023 Boston Dynamics AI Institute LLC. All rights reserved.

defaults:
  - /habitat_baselines: habitat_baselines_rl_config_base
  - /benchmark/nav/objectnav: objectnav_hm3d
  - /habitat/task/lab_sensors:
      - base_explorer
      - compass_sensor
      - gps_sensor
      - heading_sensor
      - frontier_sensor
  - /habitat/task/measurements:
    - frontier_exploration_map
    - traveled_stairs
  - /habitat_baselines/rl/policy: beliefmap_policy
  - _self_

habitat:
  environment:
    iterator_options:
      max_scene_repeat_steps: 50000
      shuffle: False
  # dataset:
  #   data_path: "data/datasets/objectnav/hm3d/v1/{split}/{split}.json.gz"
  #   start_episode_id: 26  # 从第100个episode开始评估
  task:
    success_reward: 2.5
    slack_reward: -1e-3
    lab_sensors:
      base_explorer:
        turn_angle: 30
      gps_sensor:
        type: GPSSensor
        dimensionality: 3
    constraint_violation_ends_episode: false
    count_obj_collisions: false
habitat_baselines:
  evaluate: True
  eval_ckpt_path_dir: data/dummy_policy.pth
  num_environments: 1
  load_resume_state_config: False

  torch_gpu_id: 0
  tensorboard_dir: "tb"
  video_dir: "video_dir"
  test_episode_count: -1
  checkpoint_folder: "data/new_checkpoints"
  checkpoint_interval: 10
  trainer_name: "beliefmap"
  num_updates: 270000
  log_interval: 10
  num_checkpoints: -1
  # Force PyTorch to be single threaded as
  # this improves performance considerably
  force_torch_single_threaded: True

  eval:
    split: "val"

  rl:

    policy:
      name: "HabitatITMPolicyV2"

    ppo:
      # ppo params
      clip_param: 0.2
      ppo_epoch: 4
      num_mini_batch: 2
      value_loss_coef: 0.5
      entropy_coef: 0.01
      lr: 2.5e-4
      eps: 1e-5
      max_grad_norm: 0.2
      num_steps: 64
      use_gae: True
      gamma: 0.99
      tau: 0.95
      use_linear_clip_decay: False
      use_linear_lr_decay: False
      reward_window_size: 50

      use_normalized_advantage: False

      hidden_size: 512

    ddppo:
      sync_frac: 0.6
      # The PyTorch distributed backend to use
      distrib_backend: NCCL
      # Visual encoder backbone
      pretrained_weights: data/ddppo-models/gibson-2plus-resnet50.pth
      # Initialize with pretrained weights
      pretrained: False
      # Initialize just the visual encoder backbone with pretrained weights
      pretrained_encoder: False
      # Whether or not the visual encoder backbone will be trained.
      train_encoder: True
      # Whether or not to reset the critic linear layer
      reset_critic: False

      # Model parameters
      backbone: resnet50
      rnn_type: LSTM
      num_recurrent_layers: 2
