"""Configuration for math domain.

Contains system prompts and reward functions for math problem solving.
Focuses on correctness rather than style.
"""

try:
    from math_verify import parse, verify
except ImportError:
    raise ImportError("math_verify is required. Install with: pip install math-verify")


# Advisor model prompts
ADVISOR_SYSTEM_PROMPT = """You are an advisor to a student solving math problems. Provide specific guidance to help the student solve the problem correctly. You might suggest approaches, highlight key concepts, point out potential pitfalls, or provide hints without giving away the full solution."""

ADVISOR_INSTRUCTION = """You need to provide advice to a student solving the following math problem:

{problem}

Provide specific advice about how to approach this problem. Keep your advice to 3-4 sentences and focus on helping the student solve it correctly without giving away the complete solution."""

# Student model prompts
STUDENT_SYSTEM_PROMPT = """You are a student solving math problems. You will receive advice from an advisor. Based on the problem and advisor guidance, work through the problem step-by-step to find the correct answer. Always end your solution with the final answer in \\boxed{} format."""

STUDENT_INSTRUCTION = """Math Problem: {problem}

Advisor Guidance:
{advisor_feedback}

Solve this math problem step-by-step following the advisor's guidance. End with the final answer in \\boxed{{}} format."""

# Baseline prompts (no advisor)
BASELINE_SYSTEM_PROMPT = """You are a helpful assistant that solves mathematical problems. Provide your final answer using the format: \\boxed{answer}"""

BASELINE_INSTRUCTION = """Solve the following math problem step-by-step:

{problem}

End with the final answer in \\boxed{{}} format."""


def extract_answer(response_str: str) -> str:
    """Extract the final answer from a math response using math_verify.parse."""
    try:
        return parse(response_str, parsing_timeout=None)
    except Exception:
        return None


def compute_correctness_score(extracted_answer: str, ground_truth: str) -> float:
    """Compute correctness score by comparing extracted answer with ground truth using math_verify.verify."""
    if extracted_answer is None:
        return 0.0

    ground_truth_parsed = parse(ground_truth, parsing_timeout=None)

    try:
        return (
            1.0
            if verify(ground_truth_parsed, extracted_answer, timeout_seconds=None)
            else 0.0
        )
    except Exception:
        return 0.0
