import json
import re
import warnings
import sys
from io import StringIO

from rouge_score import rouge_scorer 
from rdkit import Chem
from rdkit.Chem import AllChem

scorer = rouge_scorer.RougeScorer(['rougeL'], use_stemmer=True)

def extract_json(text):
    """Extract JSON object from text"""
    text = text.replace('```json', '').replace('```', '')
    # Simple pattern: match content enclosed in braces or brackets
    simple_pattern = r'\{.*?\}'  # Non-greedy match for objects
    array_pattern = r'\[.*?\]'   # Non-greedy match for arrays
    
    # Find all possible JSON objects
    json_strings = []
    
    # First look for objects
    for match in re.finditer(simple_pattern, text, re.DOTALL):
        json_str = match.group(0)
        try:
            obj = json.loads(json_str)
            json_strings.append(json_str)
        except json.JSONDecodeError:
            pass
    
    # Then look for arrays (avoid duplicate matching)
    for match in re.finditer(array_pattern, text, re.DOTALL):
        json_str = match.group(0)
        if json_str not in json_strings:  # Avoid duplicates
            try:
                obj = json.loads(json_str)
                json_strings.append(json_str)
            except json.JSONDecodeError:
                pass
    
    # Parse and return JSON objects
    results = []
    for json_str in json_strings:
        try:
            results.append(json.loads(json_str))
        except json.JSONDecodeError as e:
            print(f"Parsing failed: {e}")
    
    if len(results) == 0 or not isinstance(results[0], dict):
        return {}
    
    return results[0]

def extract_number(s):
    """Extract numbers from string"""
    # Use regular expressions to extract all possible numbers (including integers, floats, negatives)
    numbers = re.findall(r'-?\d+\.?\d*', s)
    if numbers:
        return float(numbers[0])  # Return the first found number
    return None  # Return None if no numbers found

def evaluate_numeric(gt, pred, tolerance=0):
    """
    Evaluate numeric answers
    
    Parameters:
        gt: Ground truth answer string
        pred: Predicted answer string
        tolerance: Tolerance range, default is 0
        
    Returns:
        1: Within tolerance range
        0: Outside tolerance range
        None: Unable to extract number
    """
    # Extract numbers from strings
    gt_num = extract_number(gt)
    pred_num = extract_number(pred)
    
    # Check if numbers were successfully extracted
    if gt_num is None or pred_num is None:
        return None
    
    # Convert to float type
    gt_float = float(gt_num)
    pred_float = float(pred_num)
    
    # Check if within tolerance range
    if (gt_float - tolerance) <= pred_float <= (gt_float + tolerance):
        return 1
    return 0

def format_list(items):
    """
    Format list elements into specified string format
    - Two elements: "xx and xx"
    - Three or more elements: "xx, xx, and xx"
    """
    if len(items) == 0:
        return ""
    elif len(items) == 1:
        return items[0]
    elif len(items) == 2:
        return f"{items[0]} and {items[1]}"
    else:
        # Handle cases with three or more elements
        return ", ".join(items[:-1]) + f", and {items[-1]}"


def evaluate_string(gt, pred):
    """
    Evaluate string answers, calculate rouge-l score
    
    Parameters:
        gt: Ground truth answer string
        pred: Predicted answer string
        
    Returns:
        rouge-l score
    """
    if isinstance(pred, list):
        pred = format_list(pred)
    # Calculate rouge-l score
    scores = scorer.score(gt, pred)
    return scores['rougeL'].fmeasure

class HiddenPrints:
    """Context manager to hide all print outputs"""
    def __enter__(self):
        self._original_stdout = sys.stdout
        self._original_stderr = sys.stderr
        sys.stdout = StringIO()
        sys.stderr = StringIO()

    def __exit__(self, exc_type, exc_val, exc_tb):
        sys.stdout = self._original_stdout
        sys.stderr = self._original_stderr

def evaluate_smiles(gt, pred):
    """Evaluate SMILES answers, completely hide all RDKit outputs"""
    # Use both warnings filtering and output redirection
    with warnings.catch_warnings(), HiddenPrints():
        warnings.simplefilter("ignore")
        try:
            # Try to create molecule objects, all outputs will be hidden
            mol_gt = Chem.MolFromSmiles(gt)
            mol_pred = Chem.MolFromSmiles(pred)
            
            # Check if molecules are valid
            if mol_gt is None or mol_pred is None:
                return evaluate_string(gt, pred)
            
            # Calculate Tanimoto similarity
            fp_gt = AllChem.GetMorganFingerprintAsBitVect(mol_gt, 2, nBits=1024)
            fp_pred = AllChem.GetMorganFingerprintAsBitVect(mol_pred, 2, nBits=1024)
            similarity = AllChem.DataStructs.TanimotoSimilarity(fp_gt, fp_pred)
            
            return similarity
            
        except Exception as e:
            # Fall back to string evaluation when exception occurs
            return evaluate_string(gt, pred)
