from sentence_transformers import SentenceTransformer, util
from bert_score import score


sbert_model = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")

def semantic_evaluation(sent1, sent2, method="sbert", lang="zh"):
    """
    计算两个句子的语义相似度评价指标
    
    参数:
        sent1 (str): 句子1
        sent2 (str): 句子2
        method (str): 'sbert' (Sentence-BERT) 或 'bertscore'
        lang (str): BERTScore 语言代码 ('zh' 中文, 'en' 英文)
    
    返回:
        dict: 相似度评价结果
    """
    
    if method.lower() == "sbert":
        
        emb1 = sbert_model.encode(sent1, convert_to_tensor=True)
        emb2 = sbert_model.encode(sent2, convert_to_tensor=True)
        sim = max(util.cos_sim(emb1, emb2).item(), 0)
        return {"Sentence-BERT Similarity": sim}
    
    elif method.lower() == "bertscore":
        
        P, R, F1 = score([sent1], [sent2], lang=lang, verbose=False)
        return {
            "BERTScore Precision": P.item(),
            "BERTScore Recall": R.item(),
            "BERTScore F1": F1.item()
        }
    
    else:
        raise ValueError("method 必须是 'sbert' 或 'bertscore'")
if __name__ == "__main__":
    
    s1 = "这只猫在垫子上。"
    s2 = "猫正坐在垫子上。"

    print("SBERT:", semantic_evaluation(s1, s2, method="sbert"))
    print("BERTScore:", semantic_evaluation(s1, s2, method="bertscore", lang="zh"))
