project_name: IGNet

# training setup
# load_run: gnm/pretrained
# set to false if you don't want to log to wandb
use_wandb: true
train: true
batch_size: 16
eval_batch_size: 16
epochs: 100
gpu_ids: [0]
num_workers: 16
num_transformer_layers: 1
freeze_image_encoder: false
# Keep the explicit decimal point: YAML 1.1 loaders such as PyYAML resolve
# a bare `5e-5` as the string "5e-5" instead of a float.
lr: 5.0e-5
optimizer: adam
seed: 0

# model params
encoder: MAE
contrast_embedding: true
# NOTE(review): string selector; the accepted values are defined by the
# consuming code and are not visible in this file.
disable_auxiliary: disable_position

# action output params
# NOTE(review): presumably the number of actions the model predicts;
# confirm against the model code.
action_num: 8
# NOTE(review): presumably the length of the predicted trajectory;
# confirm the unit (steps/waypoints) against the model code.
len_trajectory_pred: 5

# dataset specific parameters
# Dataset identifiers (kept as quoted literal strings).
location_dataset_name: 'location-2000-v1'
navigation_dataset_name: 'navigation-refine-v1'
# Paths are written relative (`../`); NOTE(review): the base directory they
# resolve against depends on the consuming code — confirm.
data_folder: '../map-pretrain-data'
data_split_folder: '../map-pretrain-data/data-split'
location_num: 2
# min and max are both 2 here.
min_query_num: 2
max_query_num: 2
# Separate sizes are given for the train and val splits.
generate_index_size_train: 4000
generate_index_size_val: 1000
goal_augment_prob: 0.5

# logging stuff
# in iterations
print_log_freq: 100
# in iterations
image_log_freq: 1000
num_images_log: 8
# in epochs
pairwise_test_freq: 10

# Everything below is legacy configuration, used in drive-any-robot

# context
# context_type: temporal
# context_size: 5

# tradeoff between action and distance prediction loss
# alpha: 0.5

# distance bounds for distance and action predictions
# distance:
#   min_dist_cat: 0
#   max_dist_cat: 20
# action:
#   min_dist_cat: 2
#   max_dist_cat: 10
# close_far_threshold: 10 # distance threshold used to separate the close and the far subgoals that are sampled per datapoint

# end_slack: 3 # because many trajectories end in collisions
# goals_per_obs: 1 # how many goals are sampled per observation
# negative_mining: True # negative mining from the ViNG paper (Shah et al.)

# image_size: [85, 64] # width, height

# normalization for the action space
# normalize: True