"""
EvaluatorUnifiedJudge class
===================================
Standalone version used inside `Decoy-for-the-Judge/standalone_jailbreak`.

IMPORTANT:
- This file uses `Decoy-for-the-Judge/unified_judge.py` (not `unified_judge_framework.py`).
- The caller script should ensure the Decoy repo root is on `sys.path` so `import unified_judge` works.
"""
import logging
import os
from jb_datasets.instance import Instance
from jb_datasets.jailbreak_datasets import JailbreakDataset
from metrics.Evaluator.Evaluator import Evaluator
from typing import Optional

from unified_judge import create_judge, JudgeEvaluator


class EvaluatorUnifiedJudge(Evaluator):
    """
    Evaluator that uses `Decoy-for-the-Judge/unified_judge.py` for evaluation.
    
    This is a drop-in replacement for EvaluatorGenerativeGetScore that uses
    the unified judge framework with the 'generative' judge type (1-10 scoring scale).
    """
    
    def __init__(
        self,
        eval_model,
        model_name: Optional[str] = None,
        temperature: float = 0.0,
        seed: Optional[int] = None,
        max_completion_tokens: int = 1000,
        provider: Optional[str] = None,
        use_local: bool = False,
        local_base_url: str = "http://localhost:30000/v1",
        **kwargs
    ):
        """
        Initialize the evaluator with unified judge framework.
        
        :param eval_model: The EasyJailbreak model object (OpenaiModel, HuggingfaceModel, etc.)
        :param str model_name: Override model name. If None, will try to extract from eval_model
        :param float temperature: Generation temperature (default: 0.0)
        :param int seed: Random seed for reproducibility (OpenAI only)
        :param int max_completion_tokens: Maximum completion tokens
        :param str provider: API provider ("openai", "gemini", "claude", or None for auto-detect)
        :param bool use_local: Whether to use local API
        :param str local_base_url: Local API base URL
        :param **kwargs: Additional parameters passed to create_judge
        """
        super().__init__(eval_model=eval_model)
        
        # Extract model name from eval_model if not provided
        if model_name is None:
            if hasattr(eval_model, 'model_name'):
                model_name = eval_model.model_name
            else:
                raise ValueError("model_name must be provided or eval_model must have a model_name attribute")
        
        # Detect provider from model name if not provided
        if provider is None:
            model_name_lower = model_name.lower()
            if model_name_lower.startswith("gemini"):
                provider = "gemini"
            elif model_name_lower.startswith("claude"):
                provider = "claude"
            else:
                provider = "openai"
        
        # Check if using local API (for OpenAI-compatible models)
        # Only auto-detect local_base_url if use_local was explicitly set to True by caller
        # If use_local is False (default), respect that and don't auto-detect from base_url
        # This prevents accidentally using local server when OpenAI API is intended
        if use_local:
            # If use_local was explicitly True, but local_base_url not provided or is default, try to detect from eval_model
            if not local_base_url or local_base_url == "http://localhost:30000/v1":
                detected_base_url = None
                if hasattr(eval_model, 'base_url') and getattr(eval_model, 'base_url'):
                    detected_base_url = getattr(eval_model, 'base_url')
                elif hasattr(eval_model, 'client') and hasattr(eval_model.client, 'base_url') and getattr(eval_model.client, 'base_url'):
                    detected_base_url = getattr(eval_model.client, 'base_url')
                
                if detected_base_url:
                    local_base_url = str(detected_base_url)
        # If use_local is False, don't auto-detect - use OpenAI API as intended
        
        # Handle determinism: if seed is None, check ENABLE_DETERMINISM environment variable
        # (matches Multi-turn-jailbreak behavior: default enabled, seed=123)
        if seed is None:
            # Prefer per-role override for eval/judge if present.
            det_env = os.getenv("ENABLE_DETERMINISM_EVAL")
            if det_env is not None:
                enable_determinism = det_env.lower() == "true"
            else:
                enable_determinism = os.getenv("ENABLE_DETERMINISM", "true").lower() == "true"
            if enable_determinism:
                seed = 123  # Default seed for determinism
            # If ENABLE_DETERMINISM=false, seed remains None (no determinism)
        
        # Create the unified judge evaluator
        self.judge_evaluator = create_judge(
            judge_type='pair',
            model_name=model_name,
            temperature=temperature,
            seed=seed,
            max_completion_tokens=max_completion_tokens,
            provider=provider,
            use_local=use_local,
            local_base_url=local_base_url,
            include_reason=False,
            include_confidence=False,
            **kwargs
        )
        
        # Track call count for compatibility with original evaluator
        self._call_count = 0
        
        # Preserve original generate method and add call count tracking
        if hasattr(self.eval_model, 'generate'):
            original_generate = self.eval_model.generate
            # Try to add count_calls and calls attributes if they don't exist
            if not hasattr(original_generate, 'count_calls'):
                # Create a wrapper that tracks calls
                class GenerateWrapper:
                    def __init__(self, original_gen, evaluator):
                        self._original = original_gen
                        self._evaluator = evaluator
                        # Preserve original attributes
                        for attr in dir(original_gen):
                            if not attr.startswith('_') and attr not in ['count_calls', 'calls']:
                                try:
                                    setattr(self, attr, getattr(original_gen, attr))
                                except:
                                    pass
                    
                    def __call__(self, *args, **kwargs):
                        return self._original(*args, **kwargs)
                    
                    @property
                    def count_calls(self):
                        return self._evaluator._call_count
                    
                    @property
                    def calls(self):
                        return self._evaluator._call_count
                
                self.eval_model.generate = GenerateWrapper(original_generate, self)
    
    def _evaluate(self, instance: Instance, **kwargs):
        """
        Evaluates a single instance and appends the result to the instance's evaluation results.
        
        :param ~Instance instance: The instance to be evaluated.
        :param **kwargs: Additional keyword arguments (for compatibility)
        :return: None. The method updates the instance's eval_results attribute.
        """
        # Get query and response from instance
        query = instance.query
        if not hasattr(instance, 'target_responses') or not instance.target_responses:
            logging.warning(f"Instance has no target_responses, using empty string")
            response = ""
        else:
            # Use the last response if multiple responses exist
            response = instance.target_responses[-1] if isinstance(instance.target_responses, list) else instance.target_responses
        
        # Evaluate using unified judge framework
        try:
            # Increment call count
            self._call_count += 1
            
            result = self.judge_evaluator.infer_single(query, response)
            # include_reason/include_confidence are disabled by default; we only need the numeric score.
            if isinstance(result, (list, tuple)):
                score = result[0] if result else None
            else:
                score = result
            
            # Handle None score (error case)
            if score is None:
                logging.warning(f"Judge evaluator returned None score. Using default score of 1.")
                score = 1
            else:
                # Ensure score is an integer within judge range (default 1..10)
                try:
                    score = int(score)
                    if score < 1:
                        score = 1
                    elif score > 10:
                        score = 10
                except (ValueError, TypeError):
                    logging.warning(f"Invalid score format: {score}. Using default score of 1.")
                    score = 1
            
            # Append score to eval_results (compatible with EvaluatorGenerativeGetScore)
            instance.eval_results.append(score)
            
        except Exception as e:
            logging.error(f"Error in unified judge evaluation: {e}")
            # On error, append default score of 1 (same as original EvaluatorGenerativeGetScore)
            instance.eval_results.append(1)

