#!/bin/bash
# =============================================================================
# Stable-QDA: Reproduce All Experiments
# =============================================================================
# 
# This script reproduces all experiments from the paper.
#
# Usage:
#   ./reproduce_all.sh           # Run all experiments
#   ./reproduce_all.sh --quick   # Quick test run
#   ./reproduce_all.sh synthetic # Run only synthetic experiments
#   ./reproduce_all.sh realworld # Run only real-world experiments
#
# Expected runtime:
#   Quick mode: ~5 minutes
#   Synthetic only: ~15 minutes
#   Real-world only: ~30 minutes
#   Full reproduction: ~1 hour
#
# =============================================================================

set -e  # Exit on error

# Configuration
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_ROOT="$(dirname "$SCRIPT_DIR")"
OUTPUT_DIR="${PROJECT_ROOT}/results"
DATA_DIR="${PROJECT_ROOT}/data"

# Parse arguments
QUICK=""
RUN_SYNTHETIC=true
RUN_REALWORLD=true

for arg in "$@"; do
    case $arg in
        --quick)
            QUICK="--quick"
            ;;
        synthetic)
            RUN_REALWORLD=false
            ;;
        realworld)
            RUN_SYNTHETIC=false
            ;;
    esac
done

# Header
echo "=============================================================================="
echo "STABLE-QDA: REPRODUCING PAPER EXPERIMENTS"
echo "=============================================================================="
echo ""
echo "Output directory: ${OUTPUT_DIR}"
echo "Quick mode: ${QUICK:-no}"
echo "Synthetic experiments: ${RUN_SYNTHETIC}"
echo "Real-world experiments: ${RUN_REALWORLD}"
echo ""

# Create output directory
mkdir -p "${OUTPUT_DIR}"
mkdir -p "${OUTPUT_DIR}/synthetic"
mkdir -p "${OUTPUT_DIR}/realworld"

# =============================================================================
# SYNTHETIC EXPERIMENTS
# =============================================================================

if [ "$RUN_SYNTHETIC" = true ]; then
    echo "=============================================================================="
    echo "SYNTHETIC EXPERIMENTS"
    echo "=============================================================================="
    
    cd "${PROJECT_ROOT}/experiments/synthetic"
    
    echo ""
    echo "[1/3] Experiment 1: Likelihood Benefit (Figure 1)"
    echo "----------------------------------------------------------------------"
    python exp1_likelihood_benefit.py ${QUICK} --output "${OUTPUT_DIR}/synthetic/"
    
    echo ""
    echo "[2/3] Experiment 2: Alpha Sensitivity (Figure 2)"
    echo "----------------------------------------------------------------------"
    python exp2_alpha_sensitivity.py ${QUICK} --output "${OUTPUT_DIR}/synthetic/"
    
    echo ""
    echo "[3/3] Experiment 3: Contamination Robustness (Figure 4)"
    echo "----------------------------------------------------------------------"
    python exp3_contamination.py ${QUICK} --output "${OUTPUT_DIR}/synthetic/"
    
    echo ""
    echo "Synthetic experiments complete."
    echo "Results saved to: ${OUTPUT_DIR}/synthetic/"
fi

# =============================================================================
# REAL-WORLD EXPERIMENTS
# =============================================================================

if [ "$RUN_REALWORLD" = true ]; then
    echo ""
    echo "=============================================================================="
    echo "REAL-WORLD EXPERIMENTS"
    echo "=============================================================================="
    
    cd "${PROJECT_ROOT}/experiments/realworld"
    
    # Check for data files
    echo ""
    echo "Checking for data files..."
    
    DATASETS=("htru2" "creditcard" "ionosphere" "weekly")
    MISSING=()
    
    for dataset in "${DATASETS[@]}"; do
        if [ ! -f "${DATA_DIR}/${dataset}.csv" ]; then
            MISSING+=("$dataset")
        fi
    done
    
    if [ ${#MISSING[@]} -gt 0 ]; then
        echo ""
        echo "WARNING: Missing datasets: ${MISSING[*]}"
        echo "Please download from URLs in data/README.md"
        echo ""
        echo "Running available datasets only..."
    fi
    
    for dataset in "${DATASETS[@]}"; do
        if [ -f "${DATA_DIR}/${dataset}.csv" ]; then
            echo ""
            echo "Evaluating: ${dataset}"
            echo "----------------------------------------------------------------------"
            python run_evaluation.py \
                --dataset "${dataset}" \
                --data_dir "${DATA_DIR}" \
                --output "${OUTPUT_DIR}/realworld/"
        fi
    done
    
    echo ""
    echo "Real-world experiments complete."
    echo "Results saved to: ${OUTPUT_DIR}/realworld/"
fi

# =============================================================================
# SUMMARY
# =============================================================================

echo ""
echo "=============================================================================="
echo "REPRODUCTION COMPLETE"
echo "=============================================================================="
echo ""
echo "Generated files:"
find "${OUTPUT_DIR}" -type f -name "*.csv" -o -name "*.pdf" -o -name "*.json" | head -20
echo ""
echo "See ${OUTPUT_DIR}/ for all results."
