#!/bin/bash
# Overnight experiment runner - keeps all 4 GPUs busy (~2 hours)
# Run with: ./run_overnight.sh 2>&1 | tee overnight_$(date +%Y%m%d_%H%M%S).log

set -e
cd "$(dirname "$0")"
source .venv/bin/activate

LOG_DIR="logs/overnight_$(date +%Y%m%d_%H%M%S)"
mkdir -p "$LOG_DIR"

echo "=============================================="
echo "Overnight Experiment Runner"
echo "Started: $(date)"
echo "Log directory: $LOG_DIR"
echo "=============================================="

# Helper function to run a job and log output
run_job() {
    local name="$1"
    local gpus="$2"
    shift 2
    local cmd="$@"

    echo "[$(date +%H:%M:%S)] Starting: $name (GPUs: $gpus)"
    if [ -z "$gpus" ]; then
        $cmd > "$LOG_DIR/${name}.log" 2>&1
    else
        CUDA_VISIBLE_DEVICES=$gpus $cmd > "$LOG_DIR/${name}.log" 2>&1
    fi
    local status=$?
    if [ $status -eq 0 ]; then
        echo "[$(date +%H:%M:%S)] Completed: $name"
    else
        echo "[$(date +%H:%M:%S)] FAILED: $name (exit code $status)"
    fi
    return $status
}

# ============================================
# PHASE 1: Experiment 3 - Old OTD Ablation (highest priority)
# Run 2 ablation jobs in parallel (each needs 2 GPUs for 70B)
# ============================================
echo ""
echo "=== PHASE 1: Experiment 3 Ablation (Old OTD) ==="

# First batch: 2 parallel jobs
run_job "exp3_165832" "0,1" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_165832_layer33_repro.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID1=$!

run_job "exp3_184422" "2,3" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_184422.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID2=$!

wait $PID1 $PID2

# Second batch
run_job "exp3_184533" "0,1" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_184533.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID1=$!

run_job "exp3_204005" "2,3" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_204005.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID2=$!

wait $PID1 $PID2

# Third batch
run_job "exp3_103648" "0,1" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260128_103648_extra_2_features.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID1=$!

run_job "exp3_overlapping" "2,3" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_overlapping_features.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID2=$!

wait $PID1 $PID2

# Fourth batch (fresh_prompts files)
run_job "exp3_105227_fresh" "0,1" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260128_105227_fresh_prompts_20.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID1=$!

run_job "exp3_111339_fresh" "2,3" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260128_111339_fresh_prompts_20.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID2=$!

wait $PID1 $PID2

# Fifth batch
run_job "exp3_115234_fresh" "0,1" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260128_115234_fresh_prompts_20.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID1=$!

run_job "exp3_115253_fresh" "2,3" .venv/bin/python experiment_3_off_topic_detectors/experiment_3_with_ablation.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260128_115253_fresh_prompts_20.json \
    --ablate data/off_topic_detectors_old.json --judge haiku &
PID2=$!

wait $PID1 $PID2

echo "=== Experiment 3 Complete ==="

# ============================================
# PHASE 2: Experiment 10 + Experiment 4 remaining
# ============================================
echo ""
echo "=== PHASE 2: Experiment 10 (Random Latent) + Experiment 4 (Finetuning) ==="

# Run Exp 4 remaining percentages
run_job "exp4_70pct" "0" ./experiment_4_finetuning/run_esr.sh --pct 70 --judge haiku --gpu 0 &
PID1=$!

run_job "exp4_80pct" "1" ./experiment_4_finetuning/run_esr.sh --pct 80 --judge haiku --gpu 0 &
PID2=$!

wait $PID1 $PID2

# Exp 10 random ablation + Exp 4 90pct + Exp 7 (no GPU)
run_job "exp10_random" "0,1" .venv/bin/python experiment_10_random_latent_control/run_random_latent_control.py run-random \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_204005.json \
    --n-sets 3 --judge haiku &
PID1=$!

run_job "exp4_90pct" "2" ./experiment_4_finetuning/run_esr.sh --pct 90 --judge haiku --gpu 0 &
PID2=$!

run_job "exp7_cross_judge" "" .venv/bin/python experiment_7_cross_judge/run_cross_judge.py --n-samples 1000 &
PID3=$!

wait $PID1 $PID2 $PID3

# Analyze exp 10 (no GPU)
run_job "exp10_analyze" "" .venv/bin/python experiment_10_random_latent_control/run_random_latent_control.py analyze

echo "=== Experiment 10 + 4 Complete ==="

# ============================================
# PHASE 3: Experiment 6 + Experiment 9
# ============================================
echo ""
echo "=== PHASE 3: Experiment 6 (Sequential) + Experiment 9 (Activation Stats) ==="

run_job "exp6_sequential" "0,1" .venv/bin/python experiment_6_sequential_activations.py &
PID1=$!

run_job "exp9_collect" "2,3" .venv/bin/python experiment_9_activation_stats/run_activation_stats.py collect-activations &
PID2=$!

wait $PID1 $PID2

run_job "exp9_baseline" "0,1" .venv/bin/python experiment_9_activation_stats/run_activation_stats.py collect-baseline

# Analyze (no GPU)
run_job "exp9_analyze" "" .venv/bin/python experiment_9_activation_stats/run_activation_stats.py analyze
run_job "exp9_output" "" .venv/bin/python experiment_9_activation_stats/run_activation_stats.py generate-output

echo "=== Experiment 6 + 9 Complete ==="

# ============================================
# PHASE 4: Experiment 8 - No-Steering Baseline
# ============================================
echo ""
echo "=== PHASE 4: Experiment 8 (No-Steering Baseline) ==="

# Gemma models
run_job "exp8_gemma2b" "0" ./python_for_gemma.sh experiment_8_no_steering_baseline.py gemma-2-2b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_gemma-2-2b-it-res-16k-layer-16_20260127_220715.json \
    --judge haiku &
PID1=$!

run_job "exp8_gemma9b" "1" ./python_for_gemma.sh experiment_8_no_steering_baseline.py gemma-2-9b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_gemma-2-9b-res-16k-layer-26_20260127_222911.json \
    --judge haiku &
PID2=$!

run_job "exp8_gemma27b" "2,3" ./python_for_gemma.sh experiment_8_no_steering_baseline.py gemma-2-27b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_gemma-2-27b-it-res-131k-layer-22_20260127_222339.json \
    --judge haiku &
PID3=$!

wait $PID1 $PID2 $PID3

# Llama models
run_job "exp8_llama8b" "0" .venv/bin/python experiment_8_no_steering_baseline.py 8b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.1-8B-Instruct_20260127_225239.json \
    --judge haiku &
PID1=$!

run_job "exp8_llama70b" "1,2,3" .venv/bin/python experiment_8_no_steering_baseline.py 70b \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_204005.json \
    --judge haiku &
PID2=$!

wait $PID1 $PID2

echo "=== Experiment 8 Complete ==="

# ============================================
# PHASE 5: Experiment 5 - Prompt Variants (if time permits)
# ============================================
echo ""
echo "=== PHASE 5: Experiment 5 (Prompt Variants) ==="

# Llama 70B prompt variants (2 GPUs each, run 2 in parallel)
run_job "exp5_70b_165832" "0,1" .venv/bin/python experiment_5_prompt_variants.py \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_165832_layer33_repro.json \
    --override-judge-model haiku --variants all &
PID1=$!

run_job "exp5_70b_184422" "2,3" .venv/bin/python experiment_5_prompt_variants.py \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_184422.json \
    --override-judge-model haiku --variants all &
PID2=$!

wait $PID1 $PID2

run_job "exp5_70b_184533" "0,1" .venv/bin/python experiment_5_prompt_variants.py \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_184533.json \
    --override-judge-model haiku --variants all &
PID1=$!

run_job "exp5_70b_204005" "2,3" .venv/bin/python experiment_5_prompt_variants.py \
    --from-results experiment_results/claude_haiku_4_5_20251001_judge/experiment_results_Meta-Llama-3.3-70B-Instruct_20260127_204005.json \
    --override-judge-model haiku --variants all &
PID2=$!

wait $PID1 $PID2

echo "=== Experiment 5 (partial) Complete ==="

# ============================================
# FINAL: Generate plots
# ============================================
echo ""
echo "=== Generating Plots ==="
run_job "plots" "" .venv/bin/python plotting/plot_all.py

echo ""
echo "=============================================="
echo "Overnight run complete!"
echo "Finished: $(date)"
echo "Check $LOG_DIR for individual job logs"
echo "=============================================="
