#!/bin/bash
#SBATCH --job-name=Eval_shortgpt_llama3_mmlu_zeroshot    # 作业名
#SBATCH --partition=lvjq                  # 队列
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=6
#SBATCH --gres=gpu:1                  
#SBATCH -o %J.out
#SBATCH -e %J.err

module load anaconda3
source activate come


export CUDA_HOME=/usr/local/cuda
export PATH=$CUDA_HOME/bin:$PATH
export LD_LIBRARY_PATH=$CUDA_HOME/lib64:$LD_LIBRARY_PATH

PYTHON=~/.conda/envs/come/bin/python
export TOKENIZERS_PARALLELISM=false

MASTER_ADDR=localhost
MASTER_PORT=4002
GPUS_PER_NODE=1


SFT_DATASET=xsum
FINETUNED_MODEL_BASE_PATH=/TO/MY/PATH/code/Understanding_Performance_Collapse/shortgpt_outputs/calib_arcc/finetune/Llama3.1-8B-Instruct/
FINETUNED_MODEL_FILE_LIST=(
  "${SFT_DATASET}/llama3-8b-0.312/Meta-Llama-3.1-8B-Instruct_shortgpt_22_lr5e-5_bs1_ep3/final"
  "${SFT_DATASET}/llama3-8b-0.219/Meta-Llama-3.1-8B-Instruct_shortgpt_25_lr5e-5_bs1_ep3/final"
  "${SFT_DATASET}/llama3-8b-0.125/Meta-Llama-3.1-8B-Instruct_shortgpt_28_lr5e-5_bs1_ep3/final"
  # "${SFT_DATASET}/llama3-8b-0.031/Meta-Llama-3.1-8B-Instruct_shortgpt_31_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.062/Meta-Llama-3.1-8B-Instruct_shortgpt_30_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.094/Meta-Llama-3.1-8B-Instruct_shortgpt_29_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.156/Meta-Llama-3.1-8B-Instruct_shortgpt_27_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.188/Meta-Llama-3.1-8B-Instruct_shortgpt_26_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.25/Meta-Llama-3.1-8B-Instruct_shortgpt_24_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.281/Meta-Llama-3.1-8B-Instruct_shortgpt_23_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.344/Meta-Llama-3.1-8B-Instruct_shortgpt_21_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.375/Meta-Llama-3.1-8B-Instruct_shortgpt_20_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.406/Meta-Llama-3.1-8B-Instruct_shortgpt_19_bs2_newlr/final"
  # "${SFT_DATASET}/llama3-8b-0.438/Meta-Llama-3.1-8B-Instruct_shortgpt_18_bs2_newlr/final"
)

echo ">>> Starting batch evaluating for ${#FINETUNED_MODEL_FILE_LIST[@]} models..."

for FINETUNED_MODEL_FILE in "${FINETUNED_MODEL_FILE_LIST[@]}"; do

    FINETUNED_MODEL_PATH=${FINETUNED_MODEL_BASE_PATH}/${FINETUNED_MODEL_FILE}
    OUTPUT_DIR=/TO/MY/PATH/code/Understanding_Performance_Collapse/shortgpt_outputs/calib_arcc/eval/Llama3.1-8B-Instruct/${FINETUNED_MODEL_FILE}

    torchrun --nproc_per_node=${GPUS_PER_NODE} --master_addr ${MASTER_ADDR} --master_port ${MASTER_PORT} /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/evaluate_pruned_llm.py \
      --model_name_or_path ${FINETUNED_MODEL_PATH} \
      --output_dir  ${OUTPUT_DIR} \
      --deepspeed_config /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/ds_config.json \
      --sft_dataset ${SFT_DATASET} \
      --eval_split test \
      --per_device_eval_batch_size 4
done

echo ">>> All evaluating tasks completed!"
