source scripts/common_setting.sh

tune_ckpt_path="pudding"

base_models=(
  "$llama2"
  "$llama2"
  "$llama2"
  "$llama2"
)

model_names=(
  "llama2"
  "llama2"
  "llama2"
  "llama2"
)

data_paths=(
  "yahma/alpaca-cleaned"
#  "yahma/alpaca-cleaned"
#  "yahma/alpaca-cleaned"
#  "yahma/alpaca-cleaned"
)

data_names=(
  "alpaca"
  "alpaca"
  "alpaca"
  "alpaca"
)

num_remove_blocks=(
  4
#  8 12 16
)

lora_r=8
gpu_ids=(4 5 6 7)

run_tuning_and_evaluation(){
  local gpu_id=$1
  local base_model=$2
  local model_name=$3
  local data_path=$4
  local data_name=$5
  local remove_blocks=$6

  base_path=baselines/PuDDing
  open_path=tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/llama_layer_list_6_advanced_tasks.csv

  ################# generate layerset
  #  CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/4_layerset/_4_sleb_easy_likelihood.py --result_folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/arc_easy --model_name ${base_model} --num_remove_blocks ${remove_blocks}
  #  CUDA_VISIBLE_DEVICES=4 python ${base_path}/codes/4_layerset/_4_sleb_challenge_likelihood.py --result_folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/arc_challenge --model_name ${base_model} --num_remove_blocks ${remove_blocks}
  #  CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/4_layerset/_4_sleb_piqa_likelihood.py --result_folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/piqa --model_name ${base_model} --num_remove_blocks ${remove_blocks}
  #  CUDA_VISIBLE_DEVICES=4 python ${base_path}/codes/4_layerset/_4_sleb_hellaswag_likelihood.py --result_folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/hellaswag --model_name ${base_model} --num_remove_blocks ${remove_blocks}
  #  CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/4_layerset/_4_sleb_winogrande_likelihood.py --result_folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/winogrande --model_name ${base_model} --num_remove_blocks ${remove_blocks}
  #  CUDA_VISIBLE_DEVICES=4 python ${base_path}/codes/4_layerset/_4_sleb_boolq_likelihood.py --result_folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/boolq --model_name ${base_model} --num_remove_blocks ${remove_blocks}

  ################# generate datasets

  #CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/5_dataset/1_log/_5_adaptive_cluster_log_easy.py --model_name ${base_model} --folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/arc_easy --open_path ${open_path}
  #CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/5_dataset/1_log/_5_adaptive_cluster_log_challenge.py --model_name ${base_model} --folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/arc_challenge --open_path ${open_path}
  #CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/5_dataset/1_log/_5_adaptive_cluster_log_piqa.py --model_name ${base_model} --folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/piqa --open_path ${open_path}
  #CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/5_dataset/1_log/_5_adaptive_cluster_log_hellaswag.py --model_name ${base_model} --folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/hellaswag --open_path ${open_path}
  #CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/5_dataset/1_log/_5_adaptive_cluster_log_winogrande_aug_1.py --model_name ${base_model} --folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/winogrande --open_path ${open_path}
  #CUDA_VISIBLE_DEVICES=3 python ${base_path}/codes/5_dataset/1_log/_5_adaptive_cluster_log_boolq.py --model_name ${base_model} --folder tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/boolq --open_path ${open_path}
#  python ${base_path}/merge_datasets.py --folder_path tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/

  ################# train router
#  CUDA_VISIBLE_DEVICES=$gpu_id python baselines/PuDDing/3_train_BERT_likelihood_MSE.py \
#    --epochs 10 \
#    --num_classes 6 \
#    --csv_files tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/data/all_log.csv \
#    --output_dir tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/router

  ################# finetune layerset with lora

#  layerset_idxs=(0 1 2 3 4 5)
#  inner_gpu_ids=(2 3 4 5)
#
#  for ((k=0; k<${#layerset_idxs[@]}; k+=4)); do
#    for l in "${!inner_gpu_ids[@]}"; do
#        idx=$((k+l))
#        if ((idx>=${#layerset_idxs[@]}));then
#          break
#        fi
#
#        echo "gpu ${inner_gpu_ids[$l]}, ${open_path}, ${layerset_idxs[$idx]}"
#        CUDA_VISIBLE_DEVICES=${inner_gpu_ids[$l]} python baselines/PuDDing/finetune.py \
#          --base_model $base_model \
#          --data_name $data_name \
#          --data_path $data_path \
#          --num_remove_blocks ${remove_blocks} \
#          --output_dir tune_log/$model_name/${tune_ckpt_path}_${remove_blocks}/${data_name}_lora${lora_r}_${layerset_idxs[$idx]}/ \
#          --lora_r $lora_r \
#          --cutoff_len 512 \
#          --num_epochs 2 \
#          --layerset_path ${open_path} \
#          --layerset_idx ${layerset_idxs[$idx]} \
#          --learning_rate 1e-4 \
#          --batch_size 8 &
#    done
#    wait  # Wait for all tuning and evaluation processes to finish
#  done


 # ---------------- eval acc ------------------
#  open_path=tune_log/${model_name}/${tune_ckpt_path}_${remove_blocks}/analysis/llama_layer_list_6_advanced_tasks.csv
#  CUDA_VISIBLE_DEVICES=${gpu_id} python baselines/PuDDing/zero_shot_eval.py \
#      --model hf \
#      --pretrained $base_model \
#      --peft=tune_log/$model_name/${tune_ckpt_path}_${remove_blocks}/ \
#      --num_remove_blocks ${remove_blocks} \
#      --layerset_path ${open_path} \
#      --device cuda:0 \
#      --batch_size 1 \
#      --tasks openbookqa,piqa,boolq,social_iqa,hellaswag,arc_easy,winogrande,arc_challenge \
#      --output_path results/$model_name/${tune_ckpt_path}_${remove_blocks}_lora${lora_r}/$data_name/

  # ---------------- eval ppl ------------------
  echo "base_model: ${base_model}"
  current_time=$(date "+%Y-%m-%d %H:%M:%S")
  echo "Start evaluation on gpu: $gpu_id, $current_time"

  CUDA_VISIBLE_DEVICES=$gpu_id python eval_metric.py \
      --name ${tune_ckpt_path} \
      --base_model $base_model \
      --peft=tune_log/$model_name/${tune_ckpt_path}_${remove_blocks}/ \
      --layerset_path ${open_path} \
      --num_remove_blocks ${remove_blocks} \
      --tasks wikitext2,ptb \
      --batch_size 4 \
      --cutoff_len 256 \
      --output_path results/$model_name/${tune_ckpt_path}_${remove_blocks}_lora${lora_r}/$data_name/

  current_time=$(date "+%Y-%m-%d %H:%M:%S")
  echo "End evaluation on gpu: $gpu_id, $current_time"
}

for ((j=0; j<${#data_paths[@]}; j+=4)); do
  for i in "${!gpu_ids[@]}"; do
      idx=$((j+i))
      if ((idx>=${#data_paths[@]}));then
        break
      fi

      gpu_id=${gpu_ids[$i]}
      base_model=${base_models[$idx]}
      model_name=${model_names[$idx]}
      data_path=${data_paths[$idx]}
      data_name=${data_names[$idx]}
      remove_blocks=${num_remove_blocks[$idx]}

      run_tuning_and_evaluation "$gpu_id" "$base_model" "$model_name" "$data_path" "$data_name" "$remove_blocks" &
  done
  wait  # Wait for all tuning and evaluation processes to finish
done