{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "https://leanresearch.local/schemas/pilot_pairs.schema.json",
  "title": "LeanResearch Pilot Pair",
  "description": "Single proof-step sample for tactic-family prediction.",
  "type": "object",
  "required": [
    "file",
    "theorem",
    "step_index",
    "main_goal",
    "local_context",
    "next_tactic",
    "tactic_family"
  ],
  "additionalProperties": false,
  "properties": {
    "file": {
      "type": "string",
      "description": "Workspace-relative Lean source path."
    },
    "theorem": {
      "type": "string",
      "description": "Name of the theorem currently being proved."
    },
    "step_index": {
      "type": "integer",
      "minimum": 0,
      "description": "0-based index inside a theorem proof script."
    },
    "main_goal": {
      "type": "string",
      "description": "Pretty-printed current main goal before applying next_tactic."
    },
    "local_context": {
      "type": "array",
      "description": "Ordered list of local hypotheses in pretty-printed form.",
      "items": {
        "type": "string"
      }
    },
    "next_tactic": {
      "type": "string",
      "description": "Original Lean tactic text for this step."
    },
    "tactic_family": {
      "type": "string",
      "enum": [
        "apply",
        "assumption",
        "by_contra",
        "cases",
        "constructor",
        "contradiction",
        "exact",
        "exact_mod_cast",
        "grind",
        "have",
        "intro",
        "left",
        "linarith",
        "obtain",
        "refine",
        "rfl",
        "right",
        "ring",
        "rintro",
        "rw",
        "simp",
        "simp_all",
        "simp_rw",
        "term"
      ],
      "description": "Normalized head-tactic family label."
    },
    "state_before": {
      "type": "string",
      "description": "Optional full pretty-printed Lean state before next_tactic."
    },
    "state_after": {
      "type": "string",
      "description": "Optional full pretty-printed Lean state after next_tactic."
    },
    "annotated_tactic": {
      "type": ["string", "null"],
      "description": "Optional LeanDojo tactic text with premise annotations."
    },
    "premises": {
      "type": "array",
      "description": "Optional LeanDojo premise provenance objects used by the tactic.",
      "items": {
        "type": "object",
        "additionalProperties": true
      }
    },
    "ast_summary": {
      "type": "object",
      "description": "Optional lightweight AST metadata used by syntax-aware representations.",
      "additionalProperties": true
    },
    "source": {
      "type": "string",
      "description": "Optional data source tag such as pilot or leandojo."
    },
    "trace_id": {
      "type": "string",
      "description": "Optional stable trace identifier."
    },
    "theorem_statement": {
      "type": "string",
      "description": "Optional theorem statement text."
    }
  }
}
