# for original pointgoal dataset
dataset_type: PointNav-v1 # for pointgoal dataset
split: val_mini  #[train, val, val_mini] # for pointgoal dataset
dataset_path: "/dataset/pointnav_gibson_v1/{split}/{split}.json.gz" # where pointgoal episode split data store
pointgoal_dataset_path: "/dataset/pointnav_gibson_v1"
content_scenes: ["*"]
scenes_dir: "/dataset"
# -----------------------------------------------
# BC training data location
behavior_dataset_path: "/dataset/behavior_dataset_gibson_1_scene_Rancocas_2000"  # where imitation learning dataset store
# Image training data location
image_dataset_path: "/dataset/image_dataset_gibson"

# experiments
algorithm_name: "rnn_bc"
experiment_name: "rel_goal_1_scene_Rancocas_2000_adamw_tau_1"
log_to_wandb: false

# dummy initial setup 
scene_id: ~/habitat-sim/data/scene_datasets/habitat-test-scenes/van-gogh-room.glb
agent_initial_position: [3, 0, 1]
agent_initial_rotation: [0, 70, 0]
goal_position: [4, 0, -1]

# dummy for saving render images
eval_video_option: [] 


# robot
forward_resolution: 0.25 # meter
rotate_resolution: 10 # degree
action_number: 4 

# observation space (env)
state_sensor: true
color_sensor: true
depth_sensor: false 
semantic_sensor: false
image_width: 224 
image_height: 224 
normalize_depth: true # if true, scale depth to [0,1] according to min and max depth
min_depth: 0
max_depth: 10.0 
dictionary_observation_space: true

# task
measurements: ['steps', 'collisions', 'distance_to_goal', 'success', 'done', 'spl', 'softspl', 'point_goal_reward', 'return']

# state
state_coord_system: polar # [polar, cartesian]
state_dimension: 2 
cos_augmented_state: false 
state_relative_to_origin: true
state_only: false # only use state as input to the agent

# goal
goal_conditioned: true  # enable goal sensor
goal_format: pointgoal # imagegoal #pointgoal
goal_relative_to_origin: false
goal_gps_compass: true # false use absolute goal location relative to the start location
goal_coord_system: polar # [polar, cartesian]
goal_dimension: 2 
cos_augmented_goal: false

# reward
success_distance: 0.2 # l2 distance in meter
success_reward: 2.5  
slack_reward: -1.0e-4 
goal_reward: true 
stop_depend_success: true

# episode termination condition (environment)
max_steps_per_episode: 500
max_collisions_per_episode: 200

# seed
seed: 1

# gpu
gpu_id: 1 

# vector env (for evaluation only)
num_environments: 14 

# bc rnn policy
rnn_hidden_size: 512
obs_embedding_size: 512
goal_embedding_size: 32
act_embedding_size: 32
rnn_type: 'gru'
goal_form:  "rel_goal" # ["rel_goal", "distance_to_goal", "abs_goal"]

# batch
batch_mode: "whole_trajectory" #["random_segment", "whole_trajectory", "partial_trajectory"]

# training
batch_size: 4 # amount to the number of vector envs during training
optimizer: "AdamW" #["AdamW", "Adam"]
learning_rate: 1.0e-4 
weight_decay: 1.0e-4
max_epochs: 200 
use_augment_train_data: false
supervise_value: false
domain_adaptation: false
temperature: 1.0
action_type: "cartesian" #["cartesian", "polar"]

# evaluate during training
eval_during_training: false
eval_every_epochs: 10 
eval_during_training_sample: true
eval_during_training_splits: ["same_start_goal_val_mini", "same_scene_val_mini", "across_scene_val_mini"]
eval_use_vector_envs: true 

# save checkpoint
save_every_epochs: 10 

# evaluation
eval_experiment_folder: "rnn_bc-rel_goal_4_scene_rancocas_2000_epoch_200_aug-s1"
eval_checkpoint_file: ["ckpt_3.pth", "ckpt_5.pth", "ckpt_10.pth", "ckpt_15.pth", "ckpt_19.pth"] 
eval_dir: "evaluation"













