#!/bin/bash
#SBATCH --job-name=trace_cka
#SBATCH --partition=lvjq
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=3
#SBATCH --gres=gpu:1
#SBATCH -o %J.out
#SBATCH -e %J.err

# Load the anaconda3 environment module, then source the `activate` script
# (looked up on PATH; presumably provided by that module -- confirm on the
# target cluster) with the environment name `come`.
module load anaconda3
. activate come

# Point the job at the CUDA toolkit under /usr/local/cuda: put its binaries
# first on PATH and its 64-bit libraries first on the loader search path.
export CUDA_HOME=/usr/local/cuda
export PATH="${CUDA_HOME}/bin:${PATH}"
# Append the previous LD_LIBRARY_PATH only when it is non-empty. A bare
# "$CUDA_HOME/lib64:" would leave an empty trailing entry, which the dynamic
# loader interprets as the current working directory.
export LD_LIBRARY_PATH="${CUDA_HOME}/lib64${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"

# Interpreter inside the `come` conda environment, addressed by its full path
# under the submitting user's home directory.
PYTHON=~/.conda/envs/come/bin/python

# Arguments forwarded verbatim to layerwise_cka_align.py. Their meaning is
# defined by that script (not visible here); judging by the flag names it
# compares a dense checkpoint against a pruned one on the arc_easy
# validation split -- confirm against the script's argument parser.
cka_args=(
  --dense_model /TO/MY/PATH/ckpt/Qwen3-4B-Instruct-2507-modelscope
  --pruned_model /TO/MY/PATH/code/Understanding_Performance_Collapse/iter_shortgpt_output/calib_arc_challenge/qwen3-4b-instruct/prun/ContinuePrun-from-ShortGPT-31Layer/Qwen3-4B-Instruct-2507-modelscope_shortgpt_18
  --output_dir /TO/MY/PATH/code/Understanding_Performance_Collapse/tools/results/1-qwen3-4b-instruct/results_cka/arc_easy
  --sft_dataset arc_easy
  --eval_split validation
  --max_length 512
  --num_eval_samples 500
  --pool mean
  --max_prompt_tokens 512
  --dtype bf16
)

# PYTHON is quoted so a home directory containing whitespace or glob
# characters still resolves to a single command word.
"${PYTHON}" /TO/MY/PATH/code/Understanding_Performance_Collapse/TALE/layerwise_cka_align.py \
  "${cka_args[@]}"
