import re

def get_user_prompt(prompt: str) -> str:
    match = re.search(r"<\|im_start\|>user\s*(.*?)\s*<\|im_end\|>", prompt, re.DOTALL)
    if match:
        return match.group(1).strip()
    lines = prompt.splitlines()
    result = []
    for line in lines:
        if not line.strip().lower().startswith("system"):
            if line.strip().lower().startswith("user"):
                result.append(line.strip()[4:].strip())
            else:
                result.append(line)
    return "\n".join(result).strip()

def get_assistant_response(text: str) -> str:
    """
    Extract the assistant's response from ChatML format, handling cases
    where the im_start tag might be missing.
    """
    # Look for <|im_start|>assistant followed by everything until <|im_end|> or end of string
    match = re.search(r"<\|im_start\|>assistant\s*(.*?)(?:<\|im_end\|>|$)", text, re.DOTALL)
    if match:
        return match.group(1).strip()
    
    # If we don't find the ChatML tags but the response has XML tags directly
    # Return the entire text up to <|im_end|> if present
    end_tag_index = text.find("<|im_end|>")
    if end_tag_index != -1:
        return text[:end_tag_index].strip()
    
    # If no ChatML tags at all, just return the text as is
    return text.strip()

def extract_xml_answer(text: str) -> str:
    match = re.search(r"<answer>\s*(.*?)\s*</answer>", text, re.DOTALL)
    if match:
        return match.group(1).strip()
    return ""  # fallback if tags are missing or malformed


def extract_hash_answer(text: str) -> str:
    if "####" not in text:
        return text.strip()
    return text.split("####", 1)[1].strip()

def count_xml(text: str) -> float:
    count = 0.0
    if text.count("<thinking>\n") == 1:
        count += 0.225
    if text.count("\n</thinking>\n") == 1:
        count += 0.225
    if text.count("\n<answer>\n") == 1:
        count += 0.225
        count -= len(text.split("\n</answer>")[-1]) * 0.001
    if text.count("\n</answer>\n") == 1:
        count += 0.225
        count -= (len(text.split("\n</answer>")[-1]) - 1) * 0.001
    return count

def create_few_shot_prompt(question, examples, system_prompt, num_examples=2):
    """Create a prompt with few-shot examples formatted as individual chat messages"""

    messages = [{"role": "system", "content": system_prompt}]

    # Take only the requested number of examples
    selected_examples = examples[:num_examples] if examples else []

    for example in selected_examples:
        messages.append({"role": "user", "content": example["similar_question"]})
        messages.append({"role": "assistant", "content": example["full_response"]})

    # Add the actual question to be answered
    messages.append({"role": "user", "content": question})

    return messages


def create_no_shot_prompt(question, system_prompt):
    """Create a prompt without few-shot examples"""

    messages = [
        {"role": "system", "content": system_prompt},
        {"role": "user", "content": f"{question}"}
    ]

    return messages

def convert_messages_to_chatml(messages, add_assistant_prompt=True):
        """
        Convert a list of message dictionaries to the ChatML format with <|im_start|> and <|im_end|> tags.

        Args:
            messages: List of dictionaries with 'role' and 'content' keys
            add_assistant_prompt: If True, adds an assistant prompt after the last user message

        Returns:
            String in ChatML format
        """
        result = []

        for message in messages:
            role = message["role"]
            content = message["content"]

            # Add the start tag with role
            result.append(f"<|im_start|>{role}")

            # Add the content (preserving any existing line breaks)
            result.append(content)

            # Add the end tag
            result.append("<|im_end|>")

        # Check if the last message is from a user and we should add an assistant prompt
        if add_assistant_prompt and messages and messages[-1]["role"] == "user":
            result.append("<|im_start|>assistant\n")
            # Empty content for assistant - the model will generate this part

        # Join everything with newlines
        return "\n".join(result)

SYSTEM_PROMPT = "Please respond in this specific format ONLY:\n<reasoning>\n input your reasoning behind your answer in between these reasoning tags.\n</reasoning>\n<answer>\nyour answer in between these answer tags.\n</answer>\n"
