#!/bin/bash
#SBATCH --job-name=shortgpt_prun_qwen3-4b-instruct
#SBATCH --partition=lvjq
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=3
#SBATCH --gres=gpu:1
#SBATCH -o %J.out
#SBATCH -e %J.err

module load anaconda3
source activate come

PYTHON=~/.conda/envs/come/bin/python

MODEL_PATH=/TO/MY/PATH/ckpt/Qwen3-4B-Instruct-2507-modelscope
# /TO/MY/PATH/ckpt/llama2-7b-chat-hf
# /TO/MY/PATH/ckpt/qwen3-4b
# /seu_nvme/ogai/models/Llama-2-7b-hf
# /seu_nvme/ogai/models/Meta-Llama-3.1-8B-Instruct
MAIN_PY=/TO/MY/PATH/code/Understanding_Performance_Collapse/main.py
SAVE_ROOT=/TO/MY/PATH/code/Understanding_Performance_Collapse/pruned_models/qwen3-4b-instruct/shortgpt/arc_challenge

TOTAL_LAYERS=36
for TL in $(seq 16 35); do
  PRUNE_RATIO=$($PYTHON - <<PY
tl=${TL}
T=${TOTAL_LAYERS}
r=(T - tl) / T
# mimic your style: keep 3 decimals, strip trailing zeros (0.250 -> 0.25)
s=f"{r:.3f}".rstrip('0').rstrip('.')
print(s)
PY
)

  SUBDIR="qwen3-4b-instruct-${PRUNE_RATIO}"
  OUTDIR="${SAVE_ROOT}/${SUBDIR}"
  mkdir -p "${OUTDIR}"

  echo "==== Run target_layers=${TL}, prune_ratio=${PRUNE_RATIO}, out=${OUTDIR} ===="

  $PYTHON ${MAIN_PY} --method shortgpt \
    --model-name ${MODEL_PATH} \
    --target-layers ${TL} \
    --save-path ${OUTDIR} \
    --calibration-dataset arc_challenge \
    --nsamples 256
    # --iterative_depth
done
