import json
from typing import List, Dict, Any
import re
import logging
from collections import Counter, defaultdict
import string


def transform_msg_to_json(raw_messages: list) -> list:
    json_msgs = []

    for message in raw_messages:
        if type(message) is dict:
            role = message.get('role')
            content = message.get('content')

            if role in ['system', 'user', 'tool']:
                json_msgs.append({
                    'role': role,
                    'content': content
                })
            elif role == 'assistant':
                json_msgs.append(message)
            continue
        else:
            role = message.role if hasattr(message, 'role') else None
            if role != 'assistant':
                raise ValueError(
                    f"Unsupported role: {role}. Only 'assistant' should be ChatCompletionMessage.")
            content = message.content if hasattr(message, 'content') else ''
            reasoning_content = message.reasoning_content if hasattr(
                message, 'reasoning_content') else ''
            tool_call_list = message.tool_calls
            log_tool_call_list = []
            if tool_call_list:
                for tool_call_item in tool_call_list:
                    function_name = tool_call_item.function.name
                    function_args = tool_call_item.function.arguments
                    log_item = {'function': {
                        'name': function_name,
                        'arguments': function_args
                    }}
                    log_tool_call_list.append(log_item)
            final_dict = {
                'role': 'assistant',
                'content': content,
                'tool_calls': log_tool_call_list
            }
            if reasoning_content:
                final_dict['reasoning_content'] = reasoning_content
            json_msgs.append(final_dict)
    return json_msgs


def parse_assistant_response(response) -> str:
    if isinstance(response, str):
        return response[-1500:]
    if not isinstance(response, list) or len(response) < 1:
        return ""
    response_list = response[-2:]
    full_content = [
        (item.get("content") or "No content")
        for item in response_list
        if isinstance(item, dict) and item.get("role") == "assistant"
    ]
    return "\n".join(full_content)[-1500:]


def normalize_text(s: str) -> str:
    if not isinstance(s, str):
        return ""
    return re.sub(r'\s+', ' ', s.lower().translate(str.maketrans("", "", string.punctuation))).strip()


def extract_answer_tag(text: str) -> str | None:
    if not text:
        return None
    match = None
    for m in re.finditer(r'<answer>(.*?)</answer>', text, re.DOTALL):
        match = m
    return match.group(1).strip() if match else text


def calculate_f1_score(prediction: str, ground_truth: str) -> float:
    pred_tokens, truth_tokens = prediction.split(), ground_truth.split()
    if not truth_tokens and not pred_tokens:
        return 1.0
    if not truth_tokens or not pred_tokens:
        return 0.0
    common_tokens = Counter(pred_tokens) & Counter(truth_tokens)
    num_same = sum(common_tokens.values())
    if num_same == 0:
        return 0.0
    precision = num_same / len(pred_tokens)
    recall = num_same / len(truth_tokens)
    return (2 * precision * recall) / (precision + recall)
