#!/bin/bash

# ---------------------------------------------------------------------------
# Configuration
# ---------------------------------------------------------------------------

# Original Qwen-MoE model to prune.
MODEL_PATH='/path/to/Qwen3'

# Calibration dataset: e.g. C4 JSON files or a HuggingFace dataset name.
DATASET_PATH='/path/to/c4_dataset'

# Destination directory for the pruned model.
OUTPUT_PATH='./pruned_model_output'

# --- Pruning parameters -----------------------------------------------------
# These are blank placeholders; fill each one in before running.

# Percentage of experts to keep globally.
RETENTION_RATIO=''
# Sensitivity for rank-aware budget allocation.
ALPHA=''
# Balance factor (0.0 = novelty only, 1.0 = salience only).
BETA=''
# Dimension for subspace analysis.
PCA_RANK=''
# Minimum number of experts to keep per layer.
MIN_EXPERTS=''

# --- Calibration parameters -------------------------------------------------
# Also blank placeholders; fill each one in before running.

# Number of sequences used for calibration.
NUM_SAMPLES=''
# Sequence length.
BLOCK_SIZE=''
# Batch size for the forward pass.
BATCH_SIZE=''

# Run Pruning
#
# Launches ragep_qwen_prune.py with the settings defined in the configuration
# section of this script, then reports where the pruned model was written.

# Stop at the first failing command (and on unset variables) so the success
# message at the end is printed only when the pruning script exited with 0.
set -euo pipefail

# Refuse to start while any setting is still blank. An empty value would
# otherwise hand the Python script a flag with no usable argument and fail
# with a far less obvious error.
missing_settings=""
for setting_name in \
    MODEL_PATH DATASET_PATH OUTPUT_PATH \
    RETENTION_RATIO ALPHA BETA PCA_RANK MIN_EXPERTS \
    NUM_SAMPLES BLOCK_SIZE BATCH_SIZE; do
    # ${!setting_name:-} is an indirect expansion: the value of the variable
    # whose name is stored in setting_name, or empty if it is unset.
    if [[ -z "${!setting_name:-}" ]]; then
        missing_settings+=" $setting_name"
    fi
done

if [[ -n "$missing_settings" ]]; then
    printf 'Error: the following settings are empty:%s\n' "$missing_settings" >&2
    printf 'Set them in the configuration section of %s and re-run.\n' "${0##*/}" >&2
    exit 1
fi

# Every expansion is quoted so each flag receives exactly one argument, even
# if a value contains whitespace or glob characters.
python ragep_qwen_prune.py \
    --model_path "$MODEL_PATH" \
    --dataset_path "$DATASET_PATH" \
    --output_path "$OUTPUT_PATH" \
    --retention_ratio "$RETENTION_RATIO" \
    --alpha "$ALPHA" \
    --beta "$BETA" \
    --pca_rank "$PCA_RANK" \
    --min_experts_per_layer "$MIN_EXPERTS" \
    --num_calib_samples "$NUM_SAMPLES" \
    --block_size "$BLOCK_SIZE" \
    --batch_size "$BATCH_SIZE"

echo "Pruning complete. Model saved to $OUTPUT_PATH"