#!/usr/bin/env bash
set -euo pipefail

ROOT="$(cd "$(dirname "$0")/.." && pwd)"

project="P2512_19197"
data_file=""
task_id=""
start_index=""
max_items=""
statement_stage="statement"
proof_stage="proof"

statement_max_b_retries=10
proof_max_b_retries=10
proof_max_c_replans=10
proof_max_no_progress_retries=2
semantic_check=1
semantic_check_policy="fix"

usage() {
  cat <<'EOF'
Usage:
  ./scripts/run_item_alternating_pipeline.sh --data-file <path> [options]

Description:
  Alternate per item: run statement first, then proof for the same label.
  Items are ordered by `index` in the input JSON (fallback: position+1).

Options:
  --project <name>                      Lean subdir under M2F/ (default: P2512_19197)
  --data-file <path>                    JSON list file (required)
  --task-id <id>                        Task id for log partitioning (default: data file stem)
  --start-index <n>                     Start from item index >= n
  --max-items <n>                       Process at most n items
  --statement-stage <name>              Statement stage (default: statement)
  --proof-stage <name>                  Proof stage (default: proof)
  --statement-max-b-retries <n>         Statement Agent B retries (default: 10)
  --proof-max-b-retries <n>             Proof Agent B retries (default: 10)
  --proof-max-c-replans <n>             Proof Agent C replans (default: 10)
  --proof-max-no-progress-retries <n>   Proof no-progress retries (default: 2)
  --semantic-check / --no-semantic-check
                                       Enable/disable statement semantic check (default: enabled)
  --semantic-check-policy <warn|fix|fail>
                                       Statement semantic-check policy (default: fix)
  -h, --help                            Show this help
EOF
}

while [[ $# -gt 0 ]]; do
  case "$1" in
    --project)
      project="${2:-}"
      shift 2
      ;;
    --project=*)
      project="${1#--project=}"
      shift
      ;;
    --data-file)
      data_file="${2:-}"
      shift 2
      ;;
    --data-file=*)
      data_file="${1#--data-file=}"
      shift
      ;;
    --task-id)
      task_id="${2:-}"
      shift 2
      ;;
    --task-id=*)
      task_id="${1#--task-id=}"
      shift
      ;;
    --start-index)
      start_index="${2:-}"
      shift 2
      ;;
    --start-index=*)
      start_index="${1#--start-index=}"
      shift
      ;;
    --max-items)
      max_items="${2:-}"
      shift 2
      ;;
    --max-items=*)
      max_items="${1#--max-items=}"
      shift
      ;;
    --statement-stage)
      statement_stage="${2:-}"
      shift 2
      ;;
    --statement-stage=*)
      statement_stage="${1#--statement-stage=}"
      shift
      ;;
    --proof-stage)
      proof_stage="${2:-}"
      shift 2
      ;;
    --proof-stage=*)
      proof_stage="${1#--proof-stage=}"
      shift
      ;;
    --statement-max-b-retries)
      statement_max_b_retries="${2:-}"
      shift 2
      ;;
    --statement-max-b-retries=*)
      statement_max_b_retries="${1#--statement-max-b-retries=}"
      shift
      ;;
    --proof-max-b-retries)
      proof_max_b_retries="${2:-}"
      shift 2
      ;;
    --proof-max-b-retries=*)
      proof_max_b_retries="${1#--proof-max-b-retries=}"
      shift
      ;;
    --proof-max-c-replans)
      proof_max_c_replans="${2:-}"
      shift 2
      ;;
    --proof-max-c-replans=*)
      proof_max_c_replans="${1#--proof-max-c-replans=}"
      shift
      ;;
    --proof-max-no-progress-retries)
      proof_max_no_progress_retries="${2:-}"
      shift 2
      ;;
    --proof-max-no-progress-retries=*)
      proof_max_no_progress_retries="${1#--proof-max-no-progress-retries=}"
      shift
      ;;
    --semantic-check)
      semantic_check=1
      shift
      ;;
    --no-semantic-check)
      semantic_check=0
      shift
      ;;
    --semantic-check-policy)
      semantic_check_policy="${2:-}"
      shift 2
      ;;
    --semantic-check-policy=*)
      semantic_check_policy="${1#--semantic-check-policy=}"
      shift
      ;;
    -h | --help)
      usage
      exit 0
      ;;
    *)
      echo "Unknown argument: $1" >&2
      usage
      exit 2
      ;;
  esac
done

if [[ -z "$data_file" ]]; then
  echo "Missing --data-file" >&2
  usage
  exit 2
fi

if [[ ! -f "$data_file" ]]; then
  echo "Data file not found: $data_file" >&2
  exit 2
fi

if [[ -z "$task_id" ]]; then
  base="$(basename "$data_file")"
  task_id="${base%.json}"
fi

mkdir -p "$ROOT/M2F/$project"

start_arg="${start_index:-}"
max_arg="${max_items:-}"
mapfile -t rows < <(
  python3 - "$data_file" "$start_arg" "$max_arg" <<'PY'
import json
import sys
from pathlib import Path

data_path = Path(sys.argv[1])
start = int(sys.argv[2]) if sys.argv[2] else None
limit = int(sys.argv[3]) if sys.argv[3] else None

raw = json.loads(data_path.read_text(encoding="utf-8"))
if not isinstance(raw, list):
    raise SystemExit(f"Expected JSON list at {data_path}")

items = []
for pos, entry in enumerate(raw):
    if not isinstance(entry, dict):
        continue
    label = entry.get("label")
    if not isinstance(label, str) or not label.strip():
        continue
    idx = entry.get("index")
    if not isinstance(idx, int):
        idx = pos + 1
    items.append((int(idx), label.strip()))

items.sort(key=lambda x: x[0])
if start is not None:
    items = [x for x in items if x[0] >= start]
if limit is not None:
    items = items[:limit]

for idx, label in items:
    print(f"{idx}\t{label}")
PY
)

if [[ ${#rows[@]} -eq 0 ]]; then
  echo "No items selected from: $data_file" >&2
  exit 1
fi

for row in "${rows[@]}"; do
  idx="${row%%$'\t'*}"
  label="${row#*$'\t'}"

  echo
  echo "=== [item index=$idx label=$label] statement ==="
  stmt_cmd=(
    bash "$ROOT/scripts/run_item_statement_pipeline.sh"
    --project "$project"
    --data-file "$data_file"
    --task-id "$task_id"
    --stage "$statement_stage"
    --only-label "$label"
    --start-index "$idx"
    --max-b-retries "$statement_max_b_retries"
  )
  if [[ "$semantic_check" -eq 1 ]]; then
    stmt_cmd+=(--semantic-check --semantic-check-policy "$semantic_check_policy")
  else
    stmt_cmd+=(--no-semantic-check)
  fi
  "${stmt_cmd[@]}"

  echo
  echo "=== [item index=$idx label=$label] proof ==="
  bash "$ROOT/scripts/run_item_proof_pipeline.sh" \
    --project "$project" \
    --data-file "$data_file" \
    --task-id "$task_id" \
    --stage "$proof_stage" \
    --only-label "$label" \
    --start-index "$idx" \
    --max-b-retries "$proof_max_b_retries" \
    --max-c-replans "$proof_max_c_replans" \
    --max-no-progress-retries "$proof_max_no_progress_retries"
done

echo
echo "Completed alternating statement->proof for ${#rows[@]} item(s)."
