# -*- coding: utf-8 -*-
from typing import List, Dict
import numpy as np, torch
from sentence_transformers import SentenceTransformer
from config import ST_MODEL_NAME

_DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
_ST = SentenceTransformer(ST_MODEL_NAME, device=_DEVICE)
_ST.max_seq_length = max(128, getattr(_ST, "max_seq_length", 256))
_ST.eval()

_EMB_CACHE: Dict[str, np.ndarray] = {}

def encode_cached(texts: List[str]) -> List[np.ndarray]:
    to_compute = [t for t in texts if t not in _EMB_CACHE]
    if to_compute:
        vecs = _ST.encode(to_compute, convert_to_numpy=True, device=_DEVICE, normalize_embeddings=True)
        for t, v in zip(to_compute, vecs):
            _EMB_CACHE[t] = v.astype(np.float32, copy=False)
    return [_EMB_CACHE[t] for t in texts]

def sim_query_to_cands(query: str, candidates: List[str]) -> List[float]:
    if not candidates: return []
    qv = encode_cached([query])[0]
    cvs = encode_cached(candidates)
    return [float(np.dot(qv, cv)) for cv in cvs]
