#!/bin/bash
#SBATCH --job-name=Eval_ITPrun_llama3_zeroshot_allmodel_mmlu    # 作业名
#SBATCH --partition=lvjq                  # 队列
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=6
#SBATCH --gres=gpu:1
#SBATCH -o %J.out
#SBATCH -e %J.err

module load anaconda3
source activate come

export CUDA_HOME=/usr/local/cuda
export PATH=$CUDA_HOME/bin:$PATH
export LD_LIBRARY_PATH=$CUDA_HOME/lib64:$LD_LIBRARY_PATH

PYTHON=~/.conda/envs/come/bin/python
export TOKENIZERS_PARALLELISM=false

MASTER_ADDR=localhost
MASTER_PORT=30021
GPUS_PER_NODE=1

SFT_DATASET_LIST=(
  "mmlu"
)
#   "hellaswag"
#   "piqa" # 保存winogrande中
#   "winogrande"  # 保存在winogrande_true中
#   "mmlu"
#   "boolq"
#   "arc_easy"

# =========================
# 需要评估的权重（完整路径）
# =========================
FINETUNED_MODEL_PATH_LIST=(
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_31"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_30"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_29"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_28"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_27"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_26"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_25"
  /TO/MY/PATH/code/Understanding_Performance_Collapse/pruned_models/llama3-8b/shortgpt/calib_mmlu/llama3-8b-0.25/Meta-Llama-3.1-8B-Instruct_shortgpt_24
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_23"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_22"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_21"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_20"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_19"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_18"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_17"
  # "/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer/Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt_16"
)

# 输出根目录（与你原先保持一致风格）
EVAL_OUT_ROOT="/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama3-8b/eval/Llama3.1-8B-Instruct_zeroshot_all_model/mmlu"

echo ">>> Starting batch evaluating for ${#FINETUNED_MODEL_PATH_LIST[@]} models..."

for SFT_DATASET in "${SFT_DATASET_LIST[@]}"; do
  echo ">>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>Start eval ${SFT_DATASET}<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<"

  for FINETUNED_MODEL_PATH in "${FINETUNED_MODEL_PATH_LIST[@]}"; do
      FINETUNED_MODEL_FILE="$(basename "${FINETUNED_MODEL_PATH}")"
      OUTPUT_DIR="${EVAL_OUT_ROOT}/${FINETUNED_MODEL_FILE}"

      torchrun --nproc_per_node=${GPUS_PER_NODE} \
        --master_addr ${MASTER_ADDR} \
        --master_port ${MASTER_PORT} \
        /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/evaluate_pruned_llm.py \
        --model_name_or_path ${FINETUNED_MODEL_PATH} \
        --output_dir  ${OUTPUT_DIR} \
        --deepspeed_config /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/ds_config.json \
        --sft_dataset ${SFT_DATASET} \
        --eval_split test \
        --per_device_eval_batch_size 4
  done

  echo ">>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>End eval ${SFT_DATASET}<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<"
done

echo ">>> All evaluating tasks completed!"
