import numpy as np
from typing import Any, List

def aggregate_score(scores, method="last"):
    if method == "last":
        return [score[-1] for score in scores]
    elif method == "mean":
        return [np.mean(score) for score in scores]
    elif method == "min":
        return [np.min(score) for score in scores]
    else:
        raise ValueError(f"Unknown aggregate method: {method}")

def add_messages_to_state(s, messages):
    for message in messages:
        # Since we are using OpenAI API, we can just store messages in state if needed,
        # but the current search algorithms mostly use raw text for math.
        # For simplicity, we just append to text.
        s.text += f"\n{message['role']}: {message['content']}\n"

def _softmax(x: np.ndarray) -> np.ndarray:
    shiftx = x - np.max(x)
    exps = np.exp(shiftx)
    return exps / np.sum(exps)

def compute_softmax_divergence(
    p_scores,
    q_scores,
    method: str = "kl",
    eps: float = 1e-12,
):
    p = _softmax(np.asarray(p_scores, dtype=np.float64))
    q = _softmax(np.asarray(q_scores, dtype=np.float64))

    if method.lower() == "kl":
        return float(np.sum(p * np.log((p + eps) / (q + eps))))
    elif method.lower() == "js":
        m = 0.5 * (p + q)
        kl_pm = np.sum(p * np.log((p + eps) / (m + eps)))
        kl_qm = np.sum(q * np.log((q + eps) / (m + eps)))
        return float(0.5 * (kl_pm + kl_qm))
    else:
        raise ValueError(f"Unknown divergence method: {method}. Supported methods are 'kl' and 'js'.")

def compute_top1_mismatch(
    p_scores,
    q_scores,
) -> float:
    if len(p_scores) == 0 or len(q_scores) == 0:
        raise ValueError("Score lists must be non-empty.")
    if len(p_scores) != len(q_scores):
        raise ValueError("Score lists must have the same length.")
    return float(int(np.argmax(p_scores) != np.argmax(q_scores)))

def compute_pairwise_inversion_ratio(
    p_scores,
    q_scores,
) -> float:
    if len(p_scores) == 0 or len(q_scores) == 0:
        raise ValueError("Score lists must be non-empty.")
    if len(p_scores) != len(q_scores):
        raise ValueError("Score lists must have the same length.")

    n = len(p_scores)
    if n < 2:
        return 0.0

    p_order = np.argsort(-np.asarray(p_scores))
    q_order = np.argsort(-np.asarray(q_scores))

    rank_p = np.empty(n, dtype=int)
    rank_q = np.empty(n, dtype=int)
    rank_p[p_order] = np.arange(n)
    rank_q[q_order] = np.arange(n)

    discordant = 0
    for i in range(n):
        for j in range(i + 1, n):
            if (rank_p[i] - rank_p[j]) * (rank_q[i] - rank_q[j]) < 0:
                discordant += 1

    total_pairs = n * (n - 1) // 2
    return discordant / total_pairs

def compute_divergence(
    p_scores,
    q_scores,
    method: str = "softmax_divergence",
    **kwargs,
):
    method = method.lower()
    if method == "softmax_divergence":
        div_type = kwargs.pop("divergence", "kl")
        eps = kwargs.pop("eps", 1e-12)
        return compute_softmax_divergence(p_scores, q_scores, method=div_type, eps=eps)
    elif method == "top1_mismatch":
        return compute_top1_mismatch(p_scores, q_scores)
    elif method == "disorder_pairs":
        return compute_pairwise_inversion_ratio(p_scores, q_scores)
    else:
        raise ValueError(
            f"Unknown divergence method: {method}. Supported values are 'softmax_divergence', 'top1_mismatch', and 'disorder_pairs'."
        )
