"""DeepSeek client + JSON parsing for LLM-judge validation.

Imports `DeepSeekClient` and `with_retry` from an external `clients.py`
module. Set the `EXTERNAL_CLIENTS_DIR` environment variable to a directory
containing that module if you intend to run the LLM-judge validation
pipeline. Not required for reproducing the headline pass@k results; this
shim is only used by analysis/exploration/llm_validation/ workflows.
"""
from __future__ import annotations

import json
import os
import re
import sys
from pathlib import Path

_EXTERNAL_SRC = Path(os.environ.get("EXTERNAL_CLIENTS_DIR", ""))
if _EXTERNAL_SRC and _EXTERNAL_SRC.is_dir() and str(_EXTERNAL_SRC) not in sys.path:
    sys.path.insert(0, str(_EXTERNAL_SRC))

from clients import DeepSeekClient, with_retry  # noqa: E402

# 9-class taxonomy (v4): added SETUP for input/format comprehension to
# resolve the persistent PLAN/OTHER boundary disagreement. Earlier 8-class
# (v3) and 10-class legacy lists below.
PRIMITIVES = [
    "PLAN", "SETUP", "ENUMERATE", "HYPOTHESIZE", "COMPUTE",
    "CHECK", "BACKTRACK", "SUMMARIZE", "OTHER",
]

PRIMITIVES_V3_8 = [
    "PLAN", "ENUMERATE", "HYPOTHESIZE", "COMPUTE",
    "CHECK", "BACKTRACK", "SUMMARIZE", "OTHER",
]

PRIMITIVES_LEGACY_10 = [
    "PLAN", "DECOMPOSE", "ENUMERATE", "HYPOTHESIZE", "COMPUTE",
    "VERIFY", "ERROR_DETECT", "BACKTRACK", "SUMMARIZE", "OTHER",
]

# Map legacy heuristic labels to the 8-class space for comparison.
LEGACY_TO_NEW = {
    "DECOMPOSE":    "PLAN",
    "VERIFY":       "CHECK",
    "ERROR_DETECT": "CHECK",
}


def to_new_taxonomy(label: str) -> str:
    """Map a legacy 10-class label into the 8-class taxonomy."""
    return LEGACY_TO_NEW.get(label, label)

_FENCE_RE = re.compile(r"```(?:json)?\s*(.*?)\s*```", re.DOTALL)


def parse_json_response(text: str | None) -> dict | None:
    """Extract a JSON object from an LLM response.

    Tries: direct json.loads -> markdown fenced block -> first-{ to last-}.
    Returns None on all failures.
    """
    if not text:
        return None
    try:
        return json.loads(text)
    except json.JSONDecodeError:
        pass
    m = _FENCE_RE.search(text)
    if m:
        try:
            return json.loads(m.group(1))
        except json.JSONDecodeError:
            pass
    lo, hi = text.find("{"), text.rfind("}")
    if 0 <= lo < hi:
        try:
            return json.loads(text[lo:hi + 1])
        except json.JSONDecodeError:
            pass
    return None


__all__ = [
    "DeepSeekClient", "with_retry", "PRIMITIVES", "PRIMITIVES_LEGACY_10",
    "LEGACY_TO_NEW", "to_new_taxonomy", "parse_json_response",
]
