#!/bin/bash
#SBATCH --job-name=Eval_shortgpt_qwen3-4b-instruct_calibarcc_zeroshot_allmodel    # 作业名
#SBATCH --partition=lvjq                  # 队列
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=6
#SBATCH --gres=gpu:1                  
#SBATCH -o %J.out
#SBATCH -e %J.err

module load anaconda3
source activate come


export CUDA_HOME=/usr/local/cuda
export PATH=$CUDA_HOME/bin:$PATH
export LD_LIBRARY_PATH=$CUDA_HOME/lib64:$LD_LIBRARY_PATH

PYTHON=~/.conda/envs/come/bin/python
export TOKENIZERS_PARALLELISM=false

MASTER_ADDR=localhost
MASTER_PORT=40022
GPUS_PER_NODE=1


SFT_DATASET_LIST=(
  "arc_challenge"
  "arc_easy"
  "hellaswag"
  "mmlu"
  "boolq"
  "piqa"
  "winogrande"
  "xsum"
)


FINETUNED_MODEL_BASE_PATH=/TO/MY/PATH/code/Understanding_Performance_Collapse/pruned_models/qwen3-4b-instruct/shortgpt/arc_challenge
FINETUNED_MODEL_FILE_LIST=(
  # "qwen3-4b-instruct-0.028/Qwen3-4B-Instruct-2507-modelscope_shortgpt_35"
  # "qwen3-4b-instruct-0.056/Qwen3-4B-Instruct-2507-modelscope_shortgpt_34"
  # "qwen3-4b-instruct-0.083/Qwen3-4B-Instruct-2507-modelscope_shortgpt_33"
  "qwen3-4b-instruct-0.111/Qwen3-4B-Instruct-2507-modelscope_shortgpt_32"
  # "qwen3-4b-instruct-0.139/Qwen3-4B-Instruct-2507-modelscope_shortgpt_31"
  # "qwen3-4b-instruct-0.167/Qwen3-4B-Instruct-2507-modelscope_shortgpt_30"
  "qwen3-4b-instruct-0.194/Qwen3-4B-Instruct-2507-modelscope_shortgpt_29"
  # "qwen3-4b-instruct-0.222/Qwen3-4B-Instruct-2507-modelscope_shortgpt_28"
  # "qwen3-4b-instruct-0.25/Qwen3-4B-Instruct-2507-modelscope_shortgpt_27"
  # "qwen3-4b-instruct-0.278/Qwen3-4B-Instruct-2507-modelscope_shortgpt_26"
  "qwen3-4b-instruct-0.306/Qwen3-4B-Instruct-2507-modelscope_shortgpt_25"
  # "qwen3-4b-instruct-0.333/Qwen3-4B-Instruct-2507-modelscope_shortgpt_24"
  # "qwen3-4b-instruct-0.361/Qwen3-4B-Instruct-2507-modelscope_shortgpt_23"
  # "qwen3-4b-instruct-0.389/Qwen3-4B-Instruct-2507-modelscope_shortgpt_22"
  # "qwen3-4b-instruct-0.417/Qwen3-4B-Instruct-2507-modelscope_shortgpt_21"
  # "qwen3-4b-instruct-0.444/Qwen3-4B-Instruct-2507-modelscope_shortgpt_20"
  # "qwen3-4b-instruct-0.472/Qwen3-4B-Instruct-2507-modelscope_shortgpt_19"
  # "qwen3-4b-instruct-0.5/Qwen3-4B-Instruct-2507-modelscope_shortgpt_18"
  # "qwen3-4b-instruct-0.528/Qwen3-4B-Instruct-2507-modelscope_shortgpt_17"
  # "qwen3-4b-instruct-0.556/Qwen3-4B-Instruct-2507-modelscope_shortgpt_16"
)
echo ">>> Starting batch evaluating for ${#FINETUNED_MODEL_FILE_LIST[@]} models..."

for SFT_DATASET in "${SFT_DATASET_LIST[@]}"; do
  echo ">>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>Start eval ${SFT_DATASET}<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<"

  for FINETUNED_MODEL_FILE in "${FINETUNED_MODEL_FILE_LIST[@]}"; do
      FINETUNED_MODEL_PATH=${FINETUNED_MODEL_BASE_PATH}/${FINETUNED_MODEL_FILE}
      OUTPUT_DIR=/TO/MY/PATH/code/Understanding_Performance_Collapse/shortgpt_outputs/calib_arcc/eval/qwen3-4b-instruct_zeroshot/${FINETUNED_MODEL_FILE}

      torchrun --nproc_per_node=${GPUS_PER_NODE} --master_addr ${MASTER_ADDR} --master_port ${MASTER_PORT} /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/evaluate_pruned_llm.py \
        --model_name_or_path ${FINETUNED_MODEL_PATH} \
        --output_dir  ${OUTPUT_DIR} \
        --deepspeed_config /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/ds_config.json \
        --sft_dataset ${SFT_DATASET} \
        --eval_split test \
        --per_device_eval_batch_size 4
  done
  echo ">>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>End eval ${SFT_DATASET}<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<"
done

echo ">>> All evaluating tasks completed!"
