#!/usr/bin/env bash
#
# Smoke pipeline driver.
#
# Runs, in order and aborting on the first failure:
#   1. a byte-compile pass over every *.py file directly under src/,
#   2. teacher_translate.py with --dry_run for the "statement" and "theory"
#      stages (3 records each),
#   3. grpo_mvp.py "order" over the sampled training set,
#   4. train_grpo_mvp.py "prepare" (3 records, with --difficulty_order),
#   5. train_grpo_mvp.py "reward-smoke".
#
# All generated files are written under <repo root>/outputs/smoke, where the
# repo root is taken to be the parent of the directory holding this script.
set -euo pipefail

# Resolve paths relative to this script so it can be launched from any cwd.
ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
SRC_DIR="${ROOT_DIR}/src"
TRAIN_JSONL="${ROOT_DIR}/dataset/sampled_train/grpo_train_sample.jsonl"
OUT_DIR="${ROOT_DIR}/outputs/smoke"

# Isolate the interpreter from the caller's environment: drop any inherited
# PYTHONPATH and ask Python not to add the per-user site-packages directory.
unset PYTHONPATH
export PYTHONNOUSERSITE=1

mkdir -p "${OUT_DIR}"

# Step 1: syntax-check the sources (glob intentionally left unquoted).
python -m py_compile "${SRC_DIR}"/*.py

# Step 2: teacher prompt previews, one output file per stage.
for stage in statement theory; do
  python "${SRC_DIR}/teacher_translate.py" \
    --input "${TRAIN_JSONL}" \
    --output "${OUT_DIR}/teacher_${stage}_prompt_preview.jsonl" \
    --stage "${stage}" \
    --limit 3 \
    --dry_run
done

# Step 3: write the difficulty-ordered copy of the training sample.
order_args=(
  --input "${TRAIN_JSONL}"
  --output "${OUT_DIR}/grpo_train_sample_difficulty_ordered.jsonl"
)
python "${SRC_DIR}/grpo_mvp.py" order "${order_args[@]}"

# Step 4: GRPO prompt preview for the first 3 records.
prepare_args=(
  --train_jsonl "${TRAIN_JSONL}"
  --output "${OUT_DIR}/grpo_prompt_preview.jsonl"
  --difficulty_order
  --limit 3
)
python "${SRC_DIR}/train_grpo_mvp.py" prepare "${prepare_args[@]}"

# Step 5: reward smoke check (takes no further arguments here).
python "${SRC_DIR}/train_grpo_mvp.py" reward-smoke

printf '%s\n' "Smoke pipeline completed. Outputs: ${OUT_DIR}"
