#!/bin/bash
#SBATCH --job-name=per_layer_margin_eval_sweep
#SBATCH --partition=lvjq
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=3
#SBATCH --gres=gpu:1
#SBATCH -o %J.out
#SBATCH -e %J.err

module load anaconda3
source activate come_llama2

export CUDA_HOME=/usr/local/cuda
export PATH=$CUDA_HOME/bin:$PATH
export LD_LIBRARY_PATH=$CUDA_HOME/lib64:$LD_LIBRARY_PATH
PYTHON=~/.conda/envs/come_llama2/bin/python

DENSE=/TO/MY/PATH/ckpt/llama2-7b-chat-hf
# arc_easy 
DATA=/TO/MY/PATH/MyDatasets/ARC-easy/test-00000-of-00001.parquet
# piqa DATA=/TO/MY/PATH/MyDatasets/PIQA/validation-00000-of-00001.parquet
# arc_challenge DATA=/TO/MY/PATH/MyDatasets/ARC-challenge/test-00000-of-00001.parquet
# hellaswag DATA=/TO/MY/PATH/MyDatasets/HellaS/data/validation-00000-of-00001.parquet
# winogrande DATA=/TO/MY/PATH/MyDatasets/WinoG/winogrande_xl/validation-00000-of-00001.parquet
# boolq DATA=/TO/MY/PATH/MyDatasets/BoolQ/data/validation-00000-of-00001.parquet

# output base dir
OUT_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/tools/results/0-llama2-7b-chat/arc_easy

########################calib_arc_challenge########################
# 映射：layer 30..25 <-> ratio 6.2..21.9
# No SFT
PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama2-7b-chat-hf/prun/ContinuePrun-from-ShortGPT-31Layer
PRUNED_PREFIX=llama2-7b-chat-hf_shortgpt
LAYERS=(31 30 29 28 27 26 25 24)
RATIOS=(3.1 6.2 9.4 12.5 15.6 18.8 21.9 25)
for i in "${!LAYERS[@]}"; do
  layer="${LAYERS[$i]}"
  ratio="${RATIOS[$i]}"

  PRUNED="${PRUNED_BASE}/${PRUNED_PREFIX}_${layer}"
  OUT="${OUT_BASE}/margin_hellaswag_ratio_${ratio}%"

  echo "======================================================"
  echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}, ratio=${ratio}%"
  echo "PRUNED=${PRUNED}"
  echo "OUT=${OUT}"
  echo "======================================================"

  mkdir -p "$OUT"

  $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
    --dense_model "$DENSE" \
    --pruned_model "$PRUNED" \
    --task arc_easy \
    --parquet "$DATA" \
    --split train \
    --limit 500 \
    --out_dir "$OUT"
done
echo "[Done] 32-24 layer."

PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/pruned_models/llama2-7b-chat-hf/shortgpt/calib_arc_challenge
PRUNED_PREFIX=llama2-7b-chat-hf-0.281/llama2-7b-chat-hf_shortgpt
LAYERS=(23)
RATIOS=(28.1)
for i in "${!LAYERS[@]}"; do
  layer="${LAYERS[$i]}"
  ratio="${RATIOS[$i]}"

  PRUNED="${PRUNED_BASE}/${PRUNED_PREFIX}_${layer}"
  OUT="${OUT_BASE}/margin_hellaswag_ratio_${ratio}%"

  echo "======================================================"
  echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}, ratio=${ratio}%"
  echo "PRUNED=${PRUNED}"
  echo "OUT=${OUT}"
  echo "======================================================"

  mkdir -p "$OUT"

  $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
    --dense_model "$DENSE" \
    --pruned_model "$PRUNED" \
    --task arc_easy \
    --parquet "$DATA" \
    --split train \
    --limit 500 \
    --out_dir "$OUT"
done
echo "[Done] 23 layer."


PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama2-7b-chat-hf/prun/ContinuePrun-from-ShortGPT-23Layer
PRUNED_PREFIX=llama2-7b-chat-hf_shortgpt_23_shortgpt
LAYERS=(22 21 20 19 18 17 16)
RATIOS=(31.2 34.4 37.5 40.6 43.8 46.88 50)

for i in "${!LAYERS[@]}"; do
  layer="${LAYERS[$i]}"
  ratio="${RATIOS[$i]}"

  PRUNED="${PRUNED_BASE}/${PRUNED_PREFIX}_${layer}"
  OUT="${OUT_BASE}/margin_hellaswag_ratio_${ratio}%"

  echo "======================================================"
  echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}, ratio=${ratio}%"
  echo "PRUNED=${PRUNED}"
  echo "OUT=${OUT}"
  echo "======================================================"

  mkdir -p "$OUT"

  $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
    --dense_model "$DENSE" \
    --pruned_model "$PRUNED" \
    --task arc_easy \
    --parquet "$DATA" \
    --split train \
    --limit 500 \
    --out_dir "$OUT"
done

echo "[Done] All sweeps finished."


#####################################删除特定的层#####################################
  # Meta-Llama-3.1-8B-Instruct_manualrm_28-rm3_6
  # Meta-Llama-3.1-8B-Instruct_manualrm_28-rm4_7
  # Meta-Llama-3.1-8B-Instruct_manualrm_29-rm3_5 
  # Meta-Llama-3.1-8B-Instruct_manualrm_29-rm4_6
  # Meta-Llama-3.1-8B-Instruct_manualrm_29-rm5_7
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm3_4
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm4_5 
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm5_6
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm6_7
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm3 
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm4 
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm5 
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm6
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm7
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/prun_specific_layer
# LAYERS=(
#   Meta-Llama-3.1-8B-Instruct_manualrm_28-rm3_6
#   Meta-Llama-3.1-8B-Instruct_manualrm_28-rm4_7
#   Meta-Llama-3.1-8B-Instruct_manualrm_29-rm4_6
#   Meta-Llama-3.1-8B-Instruct_manualrm_29-rm5_7
#   Meta-Llama-3.1-8B-Instruct_manualrm_30-rm5_6
# )

# for i in "${!LAYERS[@]}"; do
#   layer="${LAYERS[$i]}"
#   ratio="${RATIOS[$i]}"

#   PRUNED="${PRUNED_BASE}/${layer}/"
#   OUT="${OUT_BASE}/${layer}"

#   echo "======================================================"
#   echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}"
#   echo "PRUNED=${PRUNED}"
#   echo "OUT=${OUT}"
#   echo "======================================================"

#   mkdir -p "$OUT"

#   $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
#     --dense_model "$DENSE" \
#     --pruned_model "$PRUNED" \
#     --task boolq \
#     --parquet "$DATA" \
#     --split train \
#     --limit 500 \
#     --out_dir "$OUT"
# done

# echo "[Done] All sweeps finished."
