import re
from typing import Optional

import numpy as np

_ANSWER_RE = re.compile(r"<answer>\s*(.*?)\s*</answer>", re.IGNORECASE | re.DOTALL)
_BOXED_RE = re.compile(r"\\boxed\s*\{([^}]*)\}")


def _extract_boxed(text: str) -> Optional[str]:
    if not text:
        return None
    matches = _BOXED_RE.findall(text)
    return matches[-1] if matches else None


def _extract_answer_tag(text: str) -> Optional[str]:
    if not text:
        return None
    matches = _ANSWER_RE.findall(text)
    return matches[-1] if matches else None


def _normalize_moves(text: str) -> str:
    if not text:
        return ""
    text = re.sub(r"[\s,]+", "", str(text).upper())
    return "".join(ch for ch in text if ch in {"U", "D", "L", "R"})


def _extract_moves(text: str) -> str:
    tagged = _extract_answer_tag(text)
    if tagged is not None:
        moves = _normalize_moves(tagged)
        if moves:
            return moves
    boxed = _extract_boxed(text)
    if boxed is not None:
        moves = _normalize_moves(boxed)
        if moves:
            return moves
    return ""


def _get_maze_info(extra_info: Optional[dict]) -> Optional[dict]:
    if not extra_info:
        return None
    if isinstance(extra_info.get("interaction_kwargs"), dict):
        maze = extra_info["interaction_kwargs"].get("maze")
        if isinstance(maze, dict):
            return maze
    maze = extra_info.get("maze")
    if isinstance(maze, dict):
        return maze
    return None


def _build_ascii_grid(connection_list: np.ndarray) -> np.ndarray:
    """Render an ASCII grid (size 2*grid_n+1) with '*' walls and '.' corridors."""
    grid_n = int(connection_list.shape[1])
    size = 2 * grid_n + 1
    grid = np.full((size, size), "*", dtype="<U1")

    for r in range(grid_n):
        for c in range(grid_n):
            center_r = 2 * r + 1
            center_c = 2 * c + 1
            grid[center_r, center_c] = "."
            if connection_list[1, r, c]:
                grid[center_r, center_c + 1] = "."
            if connection_list[0, r, c]:
                grid[center_r + 1, center_c] = "."

    return grid


def _nodes_connected(connection_list: np.ndarray, a: np.ndarray, b: np.ndarray) -> bool:
    delta = b - a
    if np.abs(delta).sum() != 1:
        return False
    dim = int(np.argmax(np.abs(delta)))
    clist_node = a if delta.sum() > 0 else b
    r, c = int(clist_node[0]), int(clist_node[1])
    if r < 0 or c < 0 or r >= connection_list.shape[1] or c >= connection_list.shape[2]:
        return False
    return bool(connection_list[dim, r, c])


def compute_score(
    solution_str: str,
    ground_truth: object,
    data_source: Optional[str] = None,
    extra_info: Optional[dict] = None,
    **kwargs,
) -> float:
    """Score 1.0 if the predicted move sequence is a valid ASCII-grid path from S to E."""
    moves = _extract_moves(solution_str)
    if not moves:
        return 0.0

    maze = _get_maze_info(extra_info)
    if not maze:
        return 0.0

    try:
        grid_n = int(maze["grid_n"])
        connection_list = np.asarray(maze["connection_list"], dtype=bool)
        start_pos = np.asarray(maze["start_pos"], dtype=int)
        end_pos = np.asarray(maze["end_pos"], dtype=int)
    except Exception:
        return 0.0

    if connection_list.shape != (2, grid_n, grid_n):
        return 0.0

    if start_pos.shape != (2,) or end_pos.shape != (2,):
        return 0.0

    grid = _build_ascii_grid(connection_list)
    size = int(grid.shape[0])

    def _to_ascii(pos: np.ndarray) -> Optional[np.ndarray]:
        r, c = int(pos[0]), int(pos[1])
        if r < 0 or c < 0 or r >= grid_n or c >= grid_n:
            return None
        return np.array([2 * r + 1, 2 * c + 1], dtype=int)

    pos = _to_ascii(start_pos)
    end_pos_ascii = _to_ascii(end_pos)
    if pos is None or end_pos_ascii is None:
        return 0.0

    for move in moves:
        if move == "U":
            nxt = pos + np.array([-1, 0], dtype=int)
        elif move == "D":
            nxt = pos + np.array([1, 0], dtype=int)
        elif move == "L":
            nxt = pos + np.array([0, -1], dtype=int)
        elif move == "R":
            nxt = pos + np.array([0, 1], dtype=int)
        else:
            return 0.0

        r, c = int(nxt[0]), int(nxt[1])
        if r < 0 or c < 0 or r >= size or c >= size:
            return 0.0
        if grid[r, c] == "*":
            return 0.0
        pos = nxt

    return 1.0 if np.all(pos == end_pos_ascii) else 0.0


def verifier_fn(
    *,
    attempt_text: str,
    ground_truth: object,
    **kwargs,
) -> tuple[bool, float, None]:
    """Verifier wrapper for VerKRetryInteraction callable verifier."""
    score = compute_score(attempt_text, ground_truth, **kwargs)
    return (score > 0.0), float(score), None
