#!/bin/bash

# Configuration

# Location of the original DeepSeek-V2 Lite model.
MODEL_PATH='/path/to/DeepSeek-V2-Lite'

# Calibration dataset (e.g., C4 JSON files or a HuggingFace dataset name).
DATASET_PATH='/path/to/c4_dataset'

# Directory that receives the pruned model.
OUTPUT_PATH='./pruned_deepseek_output'

# Pruning Parameters
# Every value below is an empty placeholder; fill each one in before running.

# Global retention ratio (0.5 = keep 50% experts).
RETENTION_RATIO=""
# Rank-aware budget sensitivity.
ALPHA=""
# Balance factor (0.0 = novelty only, 1.0 = salience only).
BETA=""
# Subspace dimension for spectral novelty.
PCA_RANK=""
# Minimum number of experts to keep per layer.
MIN_EXPERTS=""

# System Parameters
# Also empty placeholders; fill each one in before running.

# Number of GPUs to use (DeepSeek usually requires multiple).
NUM_GPUS=""
# Batch size for calibration.
BATCH_SIZE=""
# Number of sequences for calibration.
NUM_SAMPLES=""

# Run Pruning
# Refuse to launch while any setting is still blank: an empty value expanded
# on the command line would leave its flag without an argument, and the
# failure would only surface later as an argument-parsing error.
for required_var in MODEL_PATH DATASET_PATH OUTPUT_PATH \
    RETENTION_RATIO ALPHA BETA PCA_RANK MIN_EXPERTS \
    NUM_GPUS BATCH_SIZE NUM_SAMPLES; do
    # ${!name} is bash indirect expansion: the value of the variable whose
    # name is stored in required_var.
    if [[ -z "${!required_var:-}" ]]; then
        printf 'Error: %s is empty; set it in the configuration section of %s\n' \
            "$required_var" "$0" >&2
        exit 1
    fi
done

# Every expansion is quoted so each value reaches the Python script as exactly
# one argument (no word splitting or globbing). On failure, report it on
# stderr and exit with the same status instead of announcing success.
python ragep_deepseek_prune.py \
    --model_path "$MODEL_PATH" \
    --dataset_path "$DATASET_PATH" \
    --output_path "$OUTPUT_PATH" \
    --global_retention_ratio "$RETENTION_RATIO" \
    --alpha "$ALPHA" \
    --beta "$BETA" \
    --pca_rank "$PCA_RANK" \
    --min_experts_per_layer "$MIN_EXPERTS" \
    --num_calib_samples "$NUM_SAMPLES" \
    --batch_size "$BATCH_SIZE" \
    --num_gpus "$NUM_GPUS" || {
    status=$?
    printf 'Error: pruning failed (exit code %s)\n' "$status" >&2
    exit "$status"
}

echo "Pruning complete. Model saved to $OUTPUT_PATH"