import re
from typing import Iterable, Optional

from verl.utils.reward_score.math_reward import is_equiv, last_boxed_only_string, remove_boxed

_NUM_RE = re.compile(r"-?\d[\d,]*(?:\.\d+)?")


def _extract_boxed_answer(solution_str: str) -> Optional[str]:
    if not solution_str:
        return None
    boxed = last_boxed_only_string(solution_str)
    if boxed is not None:
        try:
            return remove_boxed(boxed)
        except Exception:
            pass
    matches = re.findall(r"\\boxed\s*\{([^}]*)\}", solution_str)
    return matches[-1] if matches else None


def _basic_normalize(text: str) -> str:
    if text is None:
        return ""
    text = str(text).replace("$", "").replace(",", "").strip()
    if re.fullmatch(r"-?\d+(?:\.\d+)?\.", text):
        text = text[:-1]
    return text


def _last_number(text: str) -> Optional[str]:
    matches = _NUM_RE.findall(text or "")
    if not matches:
        return None
    return matches[-1].replace(",", "").strip()


def _iter_ground_truths(ground_truth: object) -> Iterable[str]:
    if ground_truth is None:
        return []
    if isinstance(ground_truth, (list, tuple, set)):
        return [str(item) for item in ground_truth]
    return [str(ground_truth)]


def compute_score(
    solution_str: str,
    ground_truth: object,
    data_source: Optional[str] = None,
    extra_info: Optional[dict] = None,
    **kwargs,
) -> float:
    """Score answers by extracting the last boxed value and comparing to ground truth."""
    extracted = _extract_boxed_answer(solution_str)
    if extracted is None:
        return 0.0

    pred = _basic_normalize(extracted)
    if not pred:
        return 0.0

    for gt in _iter_ground_truths(ground_truth):
        gt_norm = _basic_normalize(gt)
        if not gt_norm:
            continue
        if is_equiv(pred, gt_norm):
            return 1.0
        pred_num = _last_number(pred)
        gt_num = _last_number(gt_norm)
        if pred_num and gt_num and pred_num == gt_num:
            return 1.0

    return 0.0


def verifier_fn(
    *,
    attempt_text: str,
    ground_truth: object,
    **kwargs,
) -> tuple[bool, float, None]:
    """Verifier wrapper for VerKRetryInteraction callable verifier."""
    score = compute_score(attempt_text, ground_truth, **kwargs)
    return (score > 0.0), float(score), None
