
from __future__ import annotations
from typing import List, Dict, Any
import json

def exact_match(a: str, b: str) -> bool:
    return a.strip() == b.strip()

def edit_distance(a: str, b: str) -> int:
    if a == b: return 0
    m, n = len(a), len(b)
    dp = list(range(n+1))
    for i in range(1, m+1):
        prev = dp[0]
        dp[0] = i
        for j in range(1, n+1):
            cur = dp[j]
            dp[j] = min(
                dp[j] + 1,
                dp[j-1] + 1,
                prev + (a[i-1] != b[j-1])
            )
            prev = cur
    return dp[n]

def edit_similarity(a: str, b: str) -> float:
    m = max(1, max(len(a), len(b)))
    return 1.0 - (edit_distance(a, b) / m)

def _ngrams(tokens: List[str], n: int):
    return [tuple(tokens[i:i+n]) for i in range(0, max(0, len(tokens)-n+1))]

def bleu(ref: str, hyp: str, max_n: int = 4) -> float:
    import collections
    refs = ref.split()
    hyps = hyp.split()
    if not hyps: return 0.0
    precisions = []
    for n in range(1, max_n+1):
        R = collections.Counter(_ngrams(refs, n))
        H = collections.Counter(_ngrams(hyps, n))
        clip = sum(min(H[g], R[g]) for g in H)
        total = sum(H.values()) or 1
        precisions.append(clip/total)
    prod = 1.0
    for p in precisions:
        prod *= max(1e-9, p)
    return prod ** (1.0/max_n)

def lcs(a: List[str], b: List[str]) -> int:
    m, n = len(a), len(b)
    dp = [0]*(n+1)
    for i in range(1, m+1):
        prev = 0
        for j in range(1, n+1):
            tmp = dp[j]
            if a[i-1] == b[j-1]:
                dp[j] = prev + 1
            else:
                dp[j] = max(dp[j], dp[j-1])
            prev = tmp
    return dp[n]

def rouge_l(ref: str, hyp: str) -> float:
    r = ref.split(); h = hyp.split()
    if not r or not h: return 0.0
    L = lcs(r, h)
    P = L/len(h); R = L/len(r)
    if P+R == 0: return 0.0
    return 2*P*R/(P+R)

def canon_json(s: str) -> str:
    try:
        obj = json.loads(s)
        return json.dumps(obj, sort_keys=True, separators=(",",":"))
    except Exception:
        return s.strip()

def json_exact(a: str, b: str) -> bool:
    return canon_json(a) == canon_json(b)

def brier_score(probs: List[float], golds: List[int]) -> float:
    n = min(len(probs), len(golds))
    if n == 0: return 0.0
    return sum((probs[i]-golds[i])**2 for i in range(n)) / n

def topk_consistency(pred_samples: List[str]) -> float:
    if not pred_samples: return 0.0
    from collections import Counter
    tops = [canon_json(p) if p else "" for p in pred_samples]
    c = Counter(tops).most_common(1)[0][1]
    return c/len(pred_samples)
