# compliance_checks.py
# Post-generation compliance/audit checks:
#   - toxicity / profanity heuristics
#   - PHI / HIPAA sensitive pattern detection (SSN, phone, emails, addresses)
#   - banned phrases / policy rules
# If checks fail an 'escalate' flag is returned with reasons.

from typing import Tuple, List, Dict
import re


# minimal profanity list (extend in production or use specialized libs)
_PROFANITY = {"fuck", "shit", "damn", "bastard", "idiot"}

# PHI patterns (simplified)
_RE_EMAIL = re.compile(r"[a-zA-Z0-9_.+-]+@[a-zA-Z0-9-]+\.[a-zA-Z0-9-.]+")
_RE_PHONE = re.compile(r"(?:\+?\d{1,3}[-.\s]?)?(?:\(?\d{2,4}\)?[-.\s]?)?\d{3,4}[-.\s]?\d{3,4}")
_RE_SSN = re.compile(r"\b\d{3}-\d{2}-\d{4}\b")  # US SSN pattern
_RE_BANK_ACC = re.compile(r"\b(?:\d{9,18})\b")  # naive bank account / routing guess

def detect_profanity(text: str) -> List[str]:
    found = []
    low = text.lower()
    for w in _PROFANITY:
        if w in low:
            found.append(w)
    return found

def detect_phi(text: str) -> List[Tuple[str, str]]:
    """
    Detect potential PHI matches. Returns list of tuples (type, matched_str).
    """
    hits = []
    for m in _RE_EMAIL.findall(text):
        hits.append(("email", m))
    for m in _RE_PHONE.findall(text):
        # filter out very short numeric matches
        if len(re.sub(r"\D", "", m)) >= 7:
            hits.append(("phone", m))
    for m in _RE_SSN.findall(text):
        hits.append(("ssn", m))
    for m in _RE_BANK_ACC.findall(text):
        if len(m) >= 9 and len(m) <= 18:
            hits.append(("bank_acc", m))
    return hits

def run_compliance(response: str, constraint_set=None) -> Tuple[bool, Dict]:
    """
    Run a set of compliance checks on the generated response.
    Returns (pass_flag:bool, reasons:dict).
    If pass_flag == False, it's recommended to escalate.
    """
    reasons = {}
    pass_flag = True

    profanity = detect_profanity(response)
    if profanity:
        pass_flag = False
        reasons["profanity"] = profanity

    phi = detect_phi(response)
    if phi:
        pass_flag = False
        reasons["phi"] = phi

    # constraint set checks (e.g., banned phrases)
    if constraint_set is not None:
        if not constraint_set.is_allowed(response):
            pass_flag = False
            reasons["constraint_violation"] = "banned phrase matched"

    # basic length/content sanity checks
    if len(response.strip()) == 0:
        pass_flag = False
        reasons["empty_response"] = True

    # Add other checks (toxicity models, medical misinformation detectors, privacy filters) here.
    return pass_flag, reasons

def escalate(response: str, reasons: Dict):
    """
    Action to take if compliance fails. This is a placeholder:
      - log the issue
      - notify clinician/human-in-the-loop
      - store the conversation for review
    """
    # in production: send to message queue/alerting system / database
    print("ESCALATION TRIGGERED")
    print("Reasons:", reasons)
    # implement other actions as needed (webhook, email, etc.)
