#!/bin/bash
#SBATCH --job-name=per_layer_margin
#SBATCH --partition=lvjq
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=3
#SBATCH --gres=gpu:1
#SBATCH -o %J.out
#SBATCH -e %J.err

module load anaconda3
source activate come_llama2

export CUDA_HOME=/usr/local/cuda
export PATH=$CUDA_HOME/bin:$PATH
export LD_LIBRARY_PATH=$CUDA_HOME/lib64:$LD_LIBRARY_PATH
PYTHON=~/.conda/envs/come_llama2/bin/python

# /seu_nvme/ogai/models/Meta-Llama-3.1-8B-Instruct
DENSE=/seu_nvme/ogai/models/Meta-Llama-3.1-8B-Instruct
# arc_easy DATA=/TO/MY/PATH/MyDatasets/ARC-easy/test-00000-of-00001.parquet
# piqa DATA=/TO/MY/PATH/MyDatasets/PIQA/validation-00000-of-00001.parquet
# arc_challenge DATA=/TO/MY/PATH/MyDatasets/ARC-challenge/test-00000-of-00001.parquet
# hellaswag 
DATA=/TO/MY/PATH/MyDatasets/HellaS/data/validation-00000-of-00001.parquet
# winogrande DATA=/TO/MY/PATH/MyDatasets/WinoG/winogrande_xl/validation-00000-of-00001.parquet
# boolq DATA=/TO/MY/PATH/MyDatasets/BoolQ/data/validation-00000-of-00001.parquet

########################calib_arc_challenge########################
# 映射：layer 30..25 <-> ratio 6.2..21.9
######################### No SFT #########################
# output base dir
# OUT_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/tools/llama2-7b-chat/boolq/
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama3-8b/prun/ContinuePrun-from-ShortGPT-31Layer
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt
# LAYERS=(31 30 29 28 27 26 25)
# RATIOS=(3.1 6.2 9.4 12.5 15.6 18.8 21.9)
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama3-8b/prun/ContinuePrun-from-ShortGPT-24Layer
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt
# LAYERS=(23 22 21 20 19 18)
# RATIOS=(28.1 31.2 34.4 37.5 40.6 43.8)
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/pruned_models/shortgpt/calib_arc_challenge/llama3-8b-0.25
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt
# LAYERS=(24)
# RATIOS=(25)
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama3-8b/prun/ContinuePrun-from-ShortGPT-24Layer
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt
# LAYERS=(17 16)
# RATIOS=(46.88 50)

######################### SFT #########################
# output base dir
# OUT_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/tools/results/2_1-New-llama3-8b-instruct/sft_metric/
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama3-8b/finetune/from-ShortGPT-31Layer/arc_challenge
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt
# LAYERS=(31 30 29 28 27 26 25)
# RATIOS=(3.1 6.2 9.4 12.5 15.6 18.8 21.9)

# for i in "${!LAYERS[@]}"; do
#   layer="${LAYERS[$i]}"
#   ratio="${RATIOS[$i]}"
#   PRUNED="${PRUNED_BASE}/${PRUNED_PREFIX}_${layer}_bs2_lr1e-5/final"
#   OUT="${OUT_BASE}/margin_arc_challenge_ratio_${ratio}%"
#   echo "======================================================"
#   echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}, ratio=${ratio}%"
#   echo "PRUNED=${PRUNED}"
#   echo "OUT=${OUT}"
#   echo "======================================================"
#   mkdir -p "$OUT"
#   $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
#     --dense_model "$DENSE" \
#     --pruned_model "$PRUNED" \
#     --task arc_challenge \
#     --parquet "$DATA" \
#     --split train \
#     --limit 500 \
#     --out_dir "$OUT"
# done

# OUT="${OUT_BASE}/margin_arc_challenge_ratio_25%"
# PRUNED=/TO/MY/PATH/code/Understanding_Performance_Collapse/shortgpt_outputs/calib_arcc/finetune/Llama3.1-8B-Instruct/arc_challenge/llama3-8b-0.25/Meta-Llama-3.1-8B-Instruct_shortgpt_24_bs2_newlr/final
# $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
#   --dense_model "$DENSE" \
#   --pruned_model "$PRUNED" \
#   --task arc_challenge \
#   --parquet "$DATA" \
#   --split train \
#   --limit 500 \
#   --out_dir "$OUT"


# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/llama3-8b/finetune/from-ShortGPT-24Layer/arc_challenge
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt
# LAYERS=(23 22 21 20 19 18)
# RATIOS=(28.1 31.2 34.4 37.5 40.6 43.8)

# for i in "${!LAYERS[@]}"; do
#   layer="${LAYERS[$i]}"
#   ratio="${RATIOS[$i]}"
#   PRUNED="${PRUNED_BASE}/${PRUNED_PREFIX}_${layer}_bs2_lr1e-5_ep3/final"
#   OUT="${OUT_BASE}/margin_arc_challenge_ratio_${ratio}%"
#   echo "======================================================"
#   echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}, ratio=${ratio}%"
#   echo "PRUNED=${PRUNED}"
#   echo "OUT=${OUT}"
#   echo "======================================================"
#   mkdir -p "$OUT"
#   $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
#     --dense_model "$DENSE" \
#     --pruned_model "$PRUNED" \
#     --task arc_challenge \
#     --parquet "$DATA" \
#     --split train \
#     --limit 500 \
#     --out_dir "$OUT"
# done


########################calib_mmlu########################
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-24Layer
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt_24_shortgpt
# LAYERS=(23 22 21 20 19 18 17 16)
# RATIOS=(28.1 31.2 34.4 37.5 40.6 43.8 46.88 50)

# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_mmlu/llama3-8b-ContinuePrun-from-ShortGPT-31Layer
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt
# LAYERS=(31 30 29 28 27 26 25)
# RATIOS=(3.1 6.2 9.4 12.5 15.6 18.8 21.9)

# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/pruned_models/shortgpt/calib_mmlu/llama3-8b-0.25
# PRUNED_PREFIX=Meta-Llama-3.1-8B-Instruct_shortgpt
# LAYERS=(24)
# RATIOS=(25)

# for i in "${!LAYERS[@]}"; do
#   layer="${LAYERS[$i]}"
#   ratio="${RATIOS[$i]}"

#   PRUNED="${PRUNED_BASE}/${PRUNED_PREFIX}_${layer}"
#   OUT="${OUT_BASE}/margin_arc_easy_ratio_${ratio}%"

#   echo "======================================================"
#   echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}, ratio=${ratio}%"
#   echo "PRUNED=${PRUNED}"
#   echo "OUT=${OUT}"
#   echo "======================================================"

#   mkdir -p "$OUT"

#   $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
#     --dense_model "$DENSE" \
#     --pruned_model "$PRUNED" \
#     --task arc_easy \
#     --parquet "$DATA" \
#     --split train \
#     --limit 500 \
#     --out_dir "$OUT"
# done

# echo "[Done] All sweeps finished."


#####################################删除特定的层3-7#####################################
  # Meta-Llama-3.1-8B-Instruct_manualrm_28-rm3_6
  # Meta-Llama-3.1-8B-Instruct_manualrm_28-rm4_7
  # Meta-Llama-3.1-8B-Instruct_manualrm_29-rm3_5 
  # Meta-Llama-3.1-8B-Instruct_manualrm_29-rm4_6
  # Meta-Llama-3.1-8B-Instruct_manualrm_29-rm5_7
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm3_4
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm4_5 
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm5_6
  # Meta-Llama-3.1-8B-Instruct_manualrm_30-rm6_7
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm3 
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm4 
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm5 
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm6
  # Meta-Llama-3.1-8B-Instruct_manualrm_31-rm7
# PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/prun_specific_layer
# LAYERS=(
#   Meta-Llama-3.1-8B-Instruct_manualrm_28-rm3_6
#   Meta-Llama-3.1-8B-Instruct_manualrm_28-rm4_7
#   Meta-Llama-3.1-8B-Instruct_manualrm_29-rm4_6
#   Meta-Llama-3.1-8B-Instruct_manualrm_29-rm5_7
#   Meta-Llama-3.1-8B-Instruct_manualrm_30-rm5_6
# )

# for i in "${!LAYERS[@]}"; do
#   layer="${LAYERS[$i]}"
#   ratio="${RATIOS[$i]}"

#   PRUNED="${PRUNED_BASE}/${layer}/"
#   OUT="${OUT_BASE}/${layer}"

#   echo "======================================================"
#   echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}"
#   echo "PRUNED=${PRUNED}"
#   echo "OUT=${OUT}"
#   echo "======================================================"

#   mkdir -p "$OUT"

#   $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
#     --dense_model "$DENSE" \
#     --pruned_model "$PRUNED" \
#     --task boolq \
#     --parquet "$DATA" \
#     --split train \
#     --limit 500 \
#     --out_dir "$OUT"
# done

# echo "[Done] All sweeps finished."

#####################################删除特定的层16-19#####################################
OUT_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/tools/results/2-llama3-8b-instruct/results_rmlayer17/hellaswag
PRUNED_BASE=/TO/MY/PATH/code/Understanding_Performance_Collapse/prun_specific_layer
LAYERS=(
  Meta-Llama-3.1-8B-Instruct_manualrm_31-rm15
  Meta-Llama-3.1-8B-Instruct_manualrm_31-rm16
  Meta-Llama-3.1-8B-Instruct_manualrm_31-rm17
  Meta-Llama-3.1-8B-Instruct_manualrm_31-rm18
  Meta-Llama-3.1-8B-Instruct_manualrm_30-rm15_16
  Meta-Llama-3.1-8B-Instruct_manualrm_30-rm16_17
  Meta-Llama-3.1-8B-Instruct_manualrm_30-rm17_18
)

for i in "${!LAYERS[@]}"; do
  layer="${LAYERS[$i]}"
  ratio="${RATIOS[$i]}"

  PRUNED="${PRUNED_BASE}/${layer}/"
  OUT="${OUT_BASE}/${layer}"

  echo "======================================================"
  echo "[Run $((i+1))/${#LAYERS[@]}] layer=${layer}"
  echo "PRUNED=${PRUNED}"
  echo "OUT=${OUT}"
  echo "======================================================"

  mkdir -p "$OUT"

  $PYTHON /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/per_layer_margin_eval.py \
    --dense_model "$DENSE" \
    --pruned_model "$PRUNED" \
    --task hellaswag \
    --parquet "$DATA" \
    --split train \
    --limit 500 \
    --out_dir "$OUT"
done

echo "[Done] All sweeps finished."
