#!/usr/bin/env bash
set -euo pipefail

DATA="${DATA:-data/mathlib_subset_s4_steps_checked.jsonl}"
SEEDS="${SEEDS:-0,1,2,3,4,42}"
WEIGHTS="${WEIGHTS:-0,0.001,0.002,0.005,0.01,0.02,0.05,0.1,0.2,0.5,1,2}"
REPS="${REPS:-state_only,state_meta,retrieved_premise,oracle_premise}"

python -m unittest discover -s tests

python scripts/analyze_dataset.py \
  --data "$DATA" \
  --output-json results/dataset/s4_state_only_summary.json \
  --summary-csv results/tables/s4_dataset_summary.csv \
  --label-csv results/tables/s4_label_distribution.csv

python scripts/run_experiments.py \
  --data "$DATA" \
  --representations "$REPS" \
  --table-output results/tables/s4_classification_summary.csv

python scripts/run_multiseed.py \
  --data "$DATA" \
  --representations "$REPS" \
  --seeds "$SEEDS" \
  --table-output results/tables/s4_classification_multiseed.csv \
  --aggregate-output results/tables/s4_classification_aggregate.csv

python scripts/run_file_split.py \
  --data "$DATA" \
  --representations state_only,state_meta,retrieved_premise \
  --group-field file \
  --table-output results/tables/s4_file_split_classification_summary.csv

for seed in ${SEEDS//,/ }; do
  python scripts/run_search.py \
    --data "$DATA" \
    --strategy unguided,family_guided,family_soft,family_top_m,family_rrf,oracle_family \
    --representation state_only \
    --seed "$seed" \
    --family-weights "$WEIGHTS" \
    --use-validation \
    --table-output "results/tables/s4_search_validation_seed${seed}.csv"
done

python scripts/analyze_duplicates.py \
  --data "$DATA" \
  --summary-output results/tables/s4_duplicate_summary.csv \
  --examples-output results/tables/s4_duplicate_examples.csv

python scripts/analyze_family_groups.py \
  --data "$DATA" \
  --representation state_only \
  --model tfidf_linear_svm \
  --family-output results/tables/s4_per_family_f1.csv \
  --group-output results/tables/s4_grouped_family_f1.csv

python scripts/run_confidence_analysis.py \
  --data "$DATA" \
  --representation state_only \
  --family-model logistic_regression \
  --family-weight 0.25 \
  --output results/tables/s4_confidence_exposure.csv

python scripts/run_lean_execution.py \
  --data "$DATA" \
  --strategy unguided,family_guided,family_soft,family_top_m,family_rrf \
  --representation state_only \
  --seed 42 \
  --sample-size 500 \
  --max-k 5 \
  --cache-output results/execution/s4_state_only_execution_queue.jsonl \
  --summary-output results/tables/s4_state_only_execution_queue_summary.jsonl

echo "Queued Lean execution records. Add --execute --repo <repo-url-or-path> --commit <commit> after verifying LeanDojo repo settings."
