# Top-level run settings for a PPO / DDPPO trainer configuration.
# The program that consumes this file is not visible from here, so every note
# on what a key *means* is a hedged assumption to confirm against that program.

# evaluate is false; presumably this selects training over evaluation — confirm.
evaluate: false
trainer_name: ppo
updater_name: PPO
distrib_updater_name: DDPPO
torch_gpu_id: 0
# Output locations: tensorboard_dir and video_dir are relative paths.
tensorboard_dir: tb
writer_type: tb
video_dir: video_dir
video_fps: 10
# NOTE(review): -1 looks like a sentinel rather than a real count — confirm
# what the consumer does with it.
test_episode_count: -1
# Same relative directory as checkpoint_folder below.
eval_ckpt_path_dir: data/checkpoints
num_environments: 1
# NOTE(review): -1 looks like an "unset" sentinel — confirm.
num_processes: -1
rollout_storage_name: RolloutStorage
# Same relative directory as eval_ckpt_path_dir above.
checkpoint_folder: data/checkpoints
# num_updates and num_checkpoints carry positive values, while
# checkpoint_interval and total_num_steps are -1 / -1.0. Presumably the
# negative values mean "not used" and the positive counterparts govern the
# run length and checkpoint cadence — TODO confirm against the trainer.
num_updates: 10000
num_checkpoints: 10
checkpoint_interval: -1
# Written as a float (-1.0), unlike the integer -1 sentinels elsewhere.
total_num_steps: -1.0
log_interval: 10
log_file: train.log
force_blind_policy: false
verbose: true
# _target_ holds a dotted path. Presumably it is resolved Hydra-style to the
# object that builds the vectorized environments — confirm that this exact
# path is importable in the installed package version.
vector_env_factory:
  _target_: habitat_baselines.common.HabitatVectorEnvFactory
# Explicit empty list (not null).
eval_keys_to_include_in_name: []
force_torch_single_threaded: false
# Four string fields, all set to the empty string in this file.
# NOTE(review): `wb` presumably stands for a Weights & Biases writer and these
# fields are only read when that writer is selected — confirm. writer_type at
# the top of this file is `tb`.
wb:
  project_name: ''
  entity: ''
  group: ''
  run_name: ''
# Presumably controls whether the configuration stored in a resume state
# replaces this one when a run is resumed — TODO confirm.
load_resume_state_config: true
# Evaluation settings. NOTE(review): the top-level `evaluate` flag in this file
# is false, so presumably this section is inactive for this run — confirm.
eval:
  split: val
  # Presumably: take the configuration stored in the checkpoint rather than
  # this file when evaluating — confirm.
  use_ckpt_config: true
  should_load_ckpt: true
  evals_per_ep: 1
  # Explicit empty list: no video output option is listed here.
  video_option: []
  # Explicit empty mapping: no extra sensors are listed here.
  extra_sim_sensors: {}
# Profiling window. Both values are -1; NOTE(review): this looks like the
# "disabled" sentinel — confirm with the consumer.
profiling:
  capture_start_step: -1
  num_steps_to_capture: -1
should_log_single_proc_infos: false
# Explicit null: no callback is configured in this file.
on_save_ckpt_callback: null
# Reinforcement-learning section: everything nested under `rl` in this file
# (agent, preemption, policy, ppo, ddppo, ver, auxiliary_losses).
rl:
  agent:
    type: SingleAgentAccessMgr
  # Settings related to job preemption and resume state.
  preemption:
    # The key name refers to a SLURM job id; presumably it is appended to
    # output names/paths when true — confirm what exactly is suffixed.
    append_slurm_job_id: false
    # NOTE(review): the unit of this interval (updates vs. steps) is not
    # visible from this file — confirm.
    save_resume_state_interval: 100
    save_state_batch_only: false
  # Policy selection and action-distribution settings.
  policy:
    name: PointNavResNetPolicy
    action_distribution_type: categorical
    # NOTE(review): every key below concerns a standard deviation or an
    # activation, while action_distribution_type above is `categorical`.
    # Presumably these are only read for a continuous action distribution and
    # are inert here — confirm.
    action_dist:
      use_log_std: true
      use_softplus: false
      # -1 here vs. log_std_init 0.0 below; presumably -1 means "unset" since
      # use_log_std is true — TODO confirm.
      std_init: -1
      log_std_init: 0.0
      use_std_param: false
      clamp_std: true
      # Bounds: [min_std, max_std] = [1.0e-06, 1] and
      # [min_log_std, max_log_std] = [-5, 2]. max_std, min_log_std and
      # max_log_std are written as integers, min_std as a float.
      min_std: 1.0e-06
      max_std: 1
      min_log_std: -5
      max_log_std: 2
      action_activation: tanh
      scheduled_std: false
    # Explicit empty mapping: no observation transforms are listed here.
    obs_transforms: {}
    # The next line is commented out, so `hierarchical_policy` is absent from
    # the loaded configuration. NOTE(review): `???` looks like OmegaConf's
    # marker for a mandatory value that must be supplied — confirm.
    # hierarchical_policy: ???
    ovrl: false
    no_downscaling: false
    use_augmentations: false
    deterministic_actions: false
  # PPO hyperparameters. Key names follow common PPO terminology; the notes
  # below are assumptions based on those names — confirm against the updater.
  ppo:
    clip_param: 0.2
    ppo_epoch: 4
    num_mini_batch: 2
    value_loss_coef: 0.5
    entropy_coef: 0.01
    # Presumably optimizer settings: learning rate and epsilon — confirm.
    lr: 0.00025
    eps: 1.0e-05
    max_grad_norm: 0.5
    # NOTE(review): presumably the rollout length per update; the exact unit
    # (per environment or in total) is not visible here — confirm.
    num_steps: 5
    use_gae: true
    # Both linear decay schedules are switched off in this file.
    use_linear_lr_decay: false
    use_linear_clip_decay: false
    gamma: 0.99
    # NOTE(review): with use_gae true, `tau` is presumably the GAE lambda
    # parameter — confirm.
    tau: 0.95
    reward_window_size: 50
    use_normalized_advantage: false
    hidden_size: 512
    # entropy_target_factor is 0.0 and use_adaptive_entropy_pen is false;
    # presumably the former is only read when the latter is true — confirm.
    entropy_target_factor: 0.0
    use_adaptive_entropy_pen: false
    use_clipped_value_loss: true
    use_double_buffered_sampler: false
  # DDPPO section: distributed-training and network settings.
  ddppo:
    sync_frac: 0.6
    distrib_backend: GLOO
    rnn_type: GRU
    num_recurrent_layers: 1
    backbone: resnet18
    # NOTE(review): the filename below contains "resnet50" while backbone above
    # is resnet18. `pretrained` and `pretrained_encoder` are both false, so
    # presumably this path is never read in this configuration; if either flag
    # is enabled, confirm the weights match the chosen backbone.
    pretrained_weights: data/ddppo-models/gibson-2plus-resnet50.pth
    pretrained: false
    pretrained_encoder: false
    train_encoder: true
    # NOTE(review): true here while `pretrained` is false; presumably this is
    # only meaningful when pretrained weights are loaded — confirm.
    reset_critic: true
    force_distributed: false
    normalize_visual_inputs: false
  # `ver` section. NOTE(review): presumably read only by a VER-style trainer;
  # trainer_name at the top of this file is `ppo` — confirm.
  ver:
    variable_experience: true
    num_inference_workers: 2
    overlap_rollouts_and_learn: false
  # Explicit empty mapping: no auxiliary losses are listed here.
  auxiliary_losses: {}
