#!/bin/bash
#
# Quick Start Script for Hyperfitting Analysis
#
# This script runs the full experimental pipeline:
# 1. Hyperfits a TinyLlama model (fastest to test)
# 2. Runs all 4 experiments
#
# Usage:
#   ./scripts/run_full_pipeline.sh
#
# For 4090 GPU, TinyLlama takes ~1-2 hours to hyperfit
#

set -e

echo "============================================================"
echo "HYPERFITTING ANALYSIS - FULL PIPELINE"
echo "============================================================"

# Configuration
MODEL="TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T"
SAVE_DIR="./checkpoints/hyperfitted_tinyllama"
RESULTS_DIR="./results"
DTYPE="bfloat16"

# Create directories
mkdir -p $SAVE_DIR
mkdir -p $RESULTS_DIR

# Step 1: Hyperfit the model
echo ""
echo "============================================================"
echo "STEP 1: HYPERFITTING ${MODEL}"
echo "============================================================"
echo ""

python src/run_experiments.py \
    --mode hyperfit \
    --model $MODEL \
    --num_samples 2000 \
    --sequence_length 256 \
    --num_epochs 20 \
    --learning_rate 1e-6 \
    --batch_size 8 \
    --save_dir $SAVE_DIR \
    --torch_dtype $DTYPE

# Step 2: Run all experiments
echo ""
echo "============================================================"
echo "STEP 2: RUNNING ALL EXPERIMENTS"
echo "============================================================"
echo ""

python src/run_experiments.py \
    --mode experiments \
    --original_model $MODEL \
    --hyperfitted_model ${SAVE_DIR}/final \
    --num_eval_samples 100 \
    --output_dir $RESULTS_DIR \
    --torch_dtype $DTYPE

echo ""
echo "============================================================"
echo "PIPELINE COMPLETE"
echo "============================================================"
echo "Results saved to: $RESULTS_DIR"
echo ""
