#!/usr/bin/env bash
set -euo pipefail

ROOT="$(cd "$(dirname "$0")/.." && pwd)"

project=""
data_file=""
start_index=""
max_items=""
env_file=""

statement_max_b_retries=10
proof_max_b_retries=10
proof_max_c_replans=10
proof_max_no_progress_retries=2

semantic_check=1
semantic_check_policy="fix"

usage() {
  cat <<'EOF'
Usage:
  ./scripts/run_textbook_alternating_pipeline.sh --data-file <path> [options]

Description:
  Textbook-mode alternating pipeline (chapter/section formalization):
  statement and proof run alternately, exactly one item per stage each round.
  Internally uses:
    - scripts/run_statement_pipeline.sh
    - scripts/run_proof_pipeline.sh

Options:
  --project <name>                      Formalization project name (e.g. tao_analysis2_formal)
  --data-file <path>                    JSON data file for textbook pipeline (required)
  --start-index <n>                     Start index; default: min(statement_next, proof_next)
  --max-items <n>                       Number of alternating rounds to run
  --env-file <path>                     Pass through to statement/proof scripts

  --statement-max-b-retries <n>         Statement Agent B retries (default: 10)
  --proof-max-b-retries <n>             Proof Agent B retries (default: 10)
  --proof-max-c-replans <n>             Proof Agent C replans (default: 10)
  --proof-max-no-progress-retries <n>   Proof no-progress retries (default: 2)

  --semantic-check / --no-semantic-check
                                       Enable/disable statement semantic check (default: enabled)
  --semantic-check-policy <warn|fix|fail>
                                       Statement semantic-check policy (default: fix)

  -h, --help                            Show this help
EOF
}

infer_project_from_data_file() {
  local path="$1"
  local rel="$path"
  rel="${rel#./}"
  if [[ "$rel" = /* ]]; then
    [[ "$rel" == "$ROOT/"* ]] || return 1
    rel="${rel#$ROOT/}"
  fi
  [[ "$rel" == data/* ]] || return 1
  local rest="${rel#data/}"
  [[ "$rest" == */* ]] || return 1
  local p="${rest%%/*}"
  [[ -n "$p" ]] || return 1
  [[ "$p" != "proof" ]] || return 1
  printf '%s' "$p"
}

read_next_index() {
  local progress_file="$1"
  python3 - "$progress_file" <<'PY'
import json
import sys
from pathlib import Path

p = Path(sys.argv[1])
if not p.exists():
    print(1)
    raise SystemExit(0)
try:
    obj = json.loads(p.read_text(encoding="utf-8"))
    n = int(obj.get("next_index", 1))
    print(n if n > 0 else 1)
except Exception:
    print(1)
PY
}

while [[ $# -gt 0 ]]; do
  case "$1" in
    --project)
      project="${2:-}"
      shift 2
      ;;
    --project=*)
      project="${1#--project=}"
      shift
      ;;
    --data-file)
      data_file="${2:-}"
      shift 2
      ;;
    --data-file=*)
      data_file="${1#--data-file=}"
      shift
      ;;
    --start-index)
      start_index="${2:-}"
      shift 2
      ;;
    --start-index=*)
      start_index="${1#--start-index=}"
      shift
      ;;
    --max-items)
      max_items="${2:-}"
      shift 2
      ;;
    --max-items=*)
      max_items="${1#--max-items=}"
      shift
      ;;
    --env-file)
      env_file="${2:-}"
      shift 2
      ;;
    --env-file=*)
      env_file="${1#--env-file=}"
      shift
      ;;
    --statement-max-b-retries)
      statement_max_b_retries="${2:-}"
      shift 2
      ;;
    --statement-max-b-retries=*)
      statement_max_b_retries="${1#--statement-max-b-retries=}"
      shift
      ;;
    --proof-max-b-retries)
      proof_max_b_retries="${2:-}"
      shift 2
      ;;
    --proof-max-b-retries=*)
      proof_max_b_retries="${1#--proof-max-b-retries=}"
      shift
      ;;
    --proof-max-c-replans)
      proof_max_c_replans="${2:-}"
      shift 2
      ;;
    --proof-max-c-replans=*)
      proof_max_c_replans="${1#--proof-max-c-replans=}"
      shift
      ;;
    --proof-max-no-progress-retries)
      proof_max_no_progress_retries="${2:-}"
      shift 2
      ;;
    --proof-max-no-progress-retries=*)
      proof_max_no_progress_retries="${1#--proof-max-no-progress-retries=}"
      shift
      ;;
    --semantic-check)
      semantic_check=1
      shift
      ;;
    --no-semantic-check)
      semantic_check=0
      shift
      ;;
    --semantic-check-policy)
      semantic_check_policy="${2:-}"
      shift 2
      ;;
    --semantic-check-policy=*)
      semantic_check_policy="${1#--semantic-check-policy=}"
      shift
      ;;
    -h|--help)
      usage
      exit 0
      ;;
    *)
      echo "Unknown argument: $1" >&2
      usage
      exit 2
      ;;
  esac
done

if [[ -z "$data_file" ]]; then
  echo "Missing --data-file" >&2
  usage
  exit 2
fi

if [[ ! -f "$data_file" ]]; then
  echo "Data file not found: $data_file" >&2
  exit 2
fi

if [[ -z "$project" ]]; then
  project="$(infer_project_from_data_file "$data_file")" || true
fi

if [[ -z "$project" ]]; then
  echo "Unable to infer --project from --data-file. Please set --project explicitly." >&2
  exit 2
fi

stmt_progress="$ROOT/log/$project/statement_logs/statement_progress.json"
proof_progress="$ROOT/log/$project/proof_logs/proof_progress.json"

stmt_next="$(read_next_index "$stmt_progress")"
proof_next="$(read_next_index "$proof_progress")"

if [[ -n "$start_index" ]]; then
  current_index="$start_index"
else
  if (( stmt_next <= proof_next )); then
    current_index="$stmt_next"
  else
    current_index="$proof_next"
  fi
fi

force_stmt_from_cli=0
force_proof_from_cli=0
if [[ -n "$start_index" ]]; then
  # CLI start-index has higher priority than progress files.
  force_stmt_from_cli=1
  force_proof_from_cli=1
fi

round=0
while :; do
  if [[ -n "$max_items" ]] && (( round >= max_items )); then
    echo "Reached max-items=$max_items, stopping."
    break
  fi

  round=$((round + 1))
  echo
  echo "========== [round $round index $current_index] statement =========="

  stmt_next_before="$(read_next_index "$stmt_progress")"
  statement_ran=0
  if (( force_stmt_from_cli == 1 || stmt_next_before <= current_index )); then
    statement_ran=1
    stmt_cmd=(
      bash "$ROOT/scripts/run_statement_pipeline.sh"
      --project "$project"
      --data-file "$data_file"
      --start-index "$current_index"
      --max-items 1
      --max-b-retries "$statement_max_b_retries"
    )
    if [[ -n "$env_file" ]]; then
      stmt_cmd+=(--env-file "$env_file")
    fi
    if [[ "$semantic_check" -eq 1 ]]; then
      stmt_cmd+=(--semantic-check --semantic-check-policy "$semantic_check_policy")
    else
      stmt_cmd+=(--no-semantic-check)
    fi
    "${stmt_cmd[@]}"
    force_stmt_from_cli=0
  else
    echo "Statement already ahead (next_index=$stmt_next_before), skip index $current_index."
  fi

  stmt_next_after="$(read_next_index "$stmt_progress")"
  if (( stmt_next_after <= current_index )); then
    echo "Statement did not advance beyond index $current_index (next_index=$stmt_next_after). Stop." >&2
    exit 1
  fi

  proof_target_index="$current_index"
  if (( statement_ran == 1 )); then
    proof_target_index=$((stmt_next_after - 1))
  fi

  echo
  echo "========== [round $round index $proof_target_index] proof =========="

  proof_next_before="$(read_next_index "$proof_progress")"
  if (( force_proof_from_cli == 1 || proof_next_before <= proof_target_index )); then
    proof_cmd=(
      bash "$ROOT/scripts/run_proof_pipeline.sh"
      --project "$project"
      --data-file "$data_file"
      --start-index "$proof_target_index"
      --max-items 1
      --max-b-retries "$proof_max_b_retries"
      --max-c-replans "$proof_max_c_replans"
      --max-no-progress-retries "$proof_max_no_progress_retries"
    )
    if [[ -n "$env_file" ]]; then
      proof_cmd+=(--env-file "$env_file")
    fi
    "${proof_cmd[@]}"
    force_proof_from_cli=0
  else
    echo "Proof already ahead (next_index=$proof_next_before), skip index $proof_target_index."
  fi

  proof_next_after="$(read_next_index "$proof_progress")"
  if (( proof_next_after <= proof_target_index )); then
    echo "Proof did not advance beyond index $proof_target_index (next_index=$proof_next_after). Stop." >&2
    exit 1
  fi

  if (( stmt_next_after <= proof_next_after )); then
    next_index="$stmt_next_after"
  else
    next_index="$proof_next_after"
  fi

  if (( next_index <= current_index )); then
    echo "No forward progress (current=$current_index, next=$next_index). Stop." >&2
    exit 1
  fi

  echo "Round $round done. Statement next=$stmt_next_after, proof next=$proof_next_after, next round index=$next_index."
  current_index="$next_index"
done

echo
echo "Completed textbook alternating run for $round round(s)."
