# Launch moe/main_nav_moe_top1.py in --test / --submit mode on R2R, resuming
# seven checkpoints (five per-skill fine-tuned models, one "re-2k" model and
# the DUET fine-tuned baseline) with top-1 routing.
#
# Usage: <shell> <this script> <gpu-list>
#   $1 - value assigned to CUDA_VISIBLE_DEVICES for the python process
#        (e.g. "0,1,2").
#        NOTE(review): --localizer_gpu_id 1 and --skill_gpu_id 2 below
#        presumably index into the visible devices, so three GPUs would be
#        needed - confirm against the python entry point.
#
# All dataset, output and checkpoint paths are derived from DATA_ROOT, so
# relocating the dataset tree only requires editing that one line.

DATA_ROOT=../datasets

train_alg=dagger

features=clip.b16
ft_dim=512
# NOTE(review): obj_features / obj_ft_dim are not referenced anywhere below;
# kept in case another script sources this file.
obj_features=vitbase
obj_ft_dim=768

ngpus=1
bs=16
seed=0

# Experiment name; it only determines the output directory.
name=${train_alg}-${features}
name=${name}-seed.${seed}
name=${name}-aug.mp3d.prevalent.moe-top1-routing-add_prev_sub_instructions
outdir=${DATA_ROOT}/R2R/exprs_map/multi-models/${name}

# Shared options. The string is expanded UNQUOTED on the python command line
# so that the shell splits it into separate arguments; consequently none of
# the values (DATA_ROOT included) may contain whitespace or glob characters.
# NOTE(review): if the parser declares --use_lora with type=bool, the literal
# string "False" would be truthy - confirm how the option is parsed.
flag="--root_dir ${DATA_ROOT}
      --dataset r2r
      --output_dir ${outdir}
      --world_size ${ngpus}
      --seed ${seed}
      --tokenizer bert

      --enc_full_graph
      --graph_sprels
      --fusion dynamic

      --expert_policy spl
      --train_alg ${train_alg}

      --num_l_layers 9
      --num_x_layers 4
      --num_pano_layers 2

      --max_action_len 15
      --max_instr_len 200
      --train_env_names train
      --val_env_names val_seen val_unseen

      --batch_size ${bs}
      --lr 1e-5
      --iters 50000
      --log_every 500
      --aug_times 9

      --optim adamW

      --use_lora False
      --lora_r 8
      --lora_alpha 16
      --lora_target_modules query key value

      --features ${features}
      --image_feat_size ${ft_dim}
      --angle_feat_size 4

      --ml_weight 0.15

      --feat_dropout 0.4
      --dropout 0.5

      --gamma 0."

# Checkpoints handed to --resume_files. Their ORDER must stay aligned with
# the seven values given to --resume_weights further down.
finetune_dir=${DATA_ROOT}/R2R/exprs_map/finetune
ckpt_stem=dagger-clip.b16-seed.0-aug.mp3d.prevalent.temporal

resume_files=
for skill in direction vertical stop landmark region; do
  resume_files="${resume_files} ${finetune_dir}/${ckpt_stem}-aug.${skill}-resized-pretrained/ckpts/best_val_unseen"
done
resume_files="${resume_files} ${finetune_dir}/${ckpt_stem}-re-2k-pretrained/ckpts/best_val_unseen"
resume_files="${resume_files} ${DATA_ROOT}/R2R/trained_models/finetune/duet_vit-b16_ft_best_val_unseen"

# An absent $1 leaves CUDA_VISIBLE_DEVICES empty. Warn, but keep going so the
# script behaves as before for callers that rely on that.
if [ -z "${1:-}" ]; then
  echo "warning: no GPU list passed as \$1; CUDA_VISIBLE_DEVICES will be empty" >&2
fi

# Run the test-split evaluation.
echo "Running main_nav_moe_top1.py..."

# --batch_size, --train_env_names and --val_env_names also appear in $flag;
# they are repeated here with the values intended for this run.
# NOTE(review): this relies on the parser letting the later occurrence win -
# confirm. $flag and $resume_files are deliberately left unquoted (see above).
CUDA_VISIBLE_DEVICES="${1:-}" python moe/main_nav_moe_top1.py $flag \
        --test \
        --bert_ckpt_file "${DATA_ROOT}/R2R/trained_models/pretrain/duet_vit-b16_model_step_140000.pt" \
        --submit \
        --feedback argmax \
        --batch_size 8 \
        --routing_mode top1 \
        --routing_weights_type int \
        --resume_files $resume_files \
        --resume_weights 1 1 1 1 1 0 0 \
        --train_env_names val_unseen_debug \
        --val_env_names test \
        --localizer_gpu_id 1 \
        --skill_gpu_id 2

