#!/usr/bin/env bash
# Launches r2r/main_nav.py on the R2R dataset, starting from the checkpoint
# passed via --bert_ckpt_file and writing results under ${outdir}.
#
# Usage: bash <this-script> <gpu_ids>
#   <gpu_ids>  value assigned to CUDA_VISIBLE_DEVICES for the python process
#              (e.g. "0" or "0,1"). If omitted, the variable is set to the
#              empty string and a warning is printed.
#
# Requires bash (the option list is kept in an array).

# Catch typos in variable names. The python launch is the last command of the
# script, so its exit status is already the script's exit status.
set -u

DATA_ROOT=../datasets

train_alg=dagger

features=clip.b16
ft_dim=512
# NOTE(review): obj_features / obj_ft_dim are not referenced anywhere in the
# visible part of this script; kept in case something else relies on them.
# shellcheck disable=SC2034
obj_features=vitbase
# shellcheck disable=SC2034
obj_ft_dim=768

ngpus=1
bs=16
seed=0

# Experiment name; it determines the output directory below.
name=${train_alg}-${features}-seed.${seed}-aug.mp3d.prevalent.temporal-2k
outdir=${DATA_ROOT}/R2R/exprs_map/finetune/${name}-pretrained

# Base options, one array element per argv word so that values containing
# spaces or glob characters (e.g. a DATA_ROOT with a space) stay intact.
flag=(
  --root_dir "${DATA_ROOT}"
  --dataset r2r
  --output_dir "${outdir}"
  --world_size "${ngpus}"
  --seed "${seed}"
  --tokenizer bert

  --enc_full_graph
  --graph_sprels
  --fusion dynamic

  --expert_policy spl
  --train_alg "${train_alg}"

  --num_l_layers 9
  --num_x_layers 4
  --num_pano_layers 2

  --max_action_len 15
  --max_instr_len 200
  --train_env_names train
  --val_env_names val_seen val_unseen

  --batch_size "${bs}"
  --lr 1e-5
  --iters 50000
  --log_every 500
  --aug_times 9

  --optim adamW

  --use_lora False

  --features "${features}"
  --image_feat_size "${ft_dim}"
  --angle_feat_size 4

  --ml_weight 0.15

  --feat_dropout 0.4
  --dropout 0.5

  --gamma 0.
)

# GPU selection comes from the first positional argument. An empty value is
# still passed through (as before), but is now reported on stderr.
gpu_ids=${1-}
if [[ -z "${gpu_ids}" ]]; then
  printf 'warning: no GPU id argument given; CUDA_VISIBLE_DEVICES will be empty\n' >&2
fi

# train
# The options after "${flag[@]}" repeat some options already present in the
# array (--tokenizer, --train_env_names, --val_env_names, --batch_size).
# NOTE(review): presumably the later occurrence takes precedence in
# main_nav.py's argument parser -- confirm before removing either copy.
# --batch_size and the dataset paths follow ${bs} / ${DATA_ROOT} so that
# editing the variables at the top of the script actually takes effect.
CUDA_VISIBLE_DEVICES="${gpu_ids}" python r2r/main_nav.py "${flag[@]}" \
  --tokenizer bert \
  --bert_ckpt_file "${DATA_ROOT}/R2R/trained_models/pretrain/duet_vit-b16_model_step_140000.pt" \
  --aug "${DATA_ROOT}/R2R/annotations/R2R_scalevln_ft_aug_enc.json" \
  --train_env_names train temporal_gpt4o_train_2k \
  --val_env_names val_seen val_unseen \
  --batch_size "${bs}"

    

     

