import sys
from typing import Optional, Dict
from og_ego_prim.guardrail.base_guardrail_model import BaseGuardrailModel

# Import EMBGuard from src package (path is set in og_ego_prim/__init__.py)
from src.guardrail import EMBGuard


class LLMGuardrailModel(BaseGuardrailModel):
    """
    Guardrail model implementation using LLM
    Can use any model (GPT-4, Claude, Llama, etc.) using EMBGuard
    """
    
    def __init__(
        self,
        provider: str,
        model_config: Dict,
        task_instruction: Optional[str] = None,
        use_few_shot: bool = True,
        use_thinking: bool = False
    ):
        """
        Args:
            provider: LLM provider ("openai", "openrouter", "vllm", "claude", "gemini")
            model_config: Model configuration dictionary
            task_instruction: Task instruction (optional, currently not used)
            use_few_shot: Whether to include few-shot examples (default: True)
            use_thinking: Whether to use thinking mode (default: False)
        """
        self.embguard = EMBGuard(provider=provider, model_config=model_config)
        self.task_instruction = task_instruction
        self.use_few_shot = use_few_shot
        self.use_thinking = use_thinking
    
    def is_risky(
        self, 
        action_nl: str, 
        image_file: Optional[str] = None,
        caution: Optional[str] = None
    ) -> Dict[str, str]:
        """
        Receive action_nl and image, ask LLM and return risky status
        
        Args:
            action_nl: Action description converted to natural language
            image_file: Captured image file path
            caution: Safety warning (optional, currently not used)
            
        Returns:
            Dict[str, str]: {
                'potential_risk': 'risky' or 'benign',
                'risk_type': risk type or 'none',
                'hazard': hazard description or 'none'
            }
        """
        # Call EMBGuard's evaluate method
        result_dict = self.embguard.evaluate(
            action=action_nl,
            image=image_file,
            use_few_shot=self.use_few_shot,
            use_thinking=self.use_thinking
        )
        
        # Extract parsed_response from EMBGuard's return value
        parsed_response = result_dict.get('parsed_response', {})
        
        # Format result
        result = {
            'potential_risk': parsed_response.get('potential_risk', 'benign'),
            'risk_type': parsed_response.get('risk_type', 'none'),
            'hazard': parsed_response.get('hazard', 'none')
        }
        
        # Normalize potential_risk value ('safe' -> 'benign', 'risky'/'unsafe' -> 'risky')
        potential_risk = result.get('potential_risk', 'benign').lower()
        if potential_risk == 'safe':
            result['potential_risk'] = 'benign'
        elif potential_risk in ['unsafe', 'risky']:
            result['potential_risk'] = 'risky'
        else:
            result['potential_risk'] = potential_risk
        
        # Output judgment result
        risk_status = result.get('potential_risk', 'unknown')
        display_status = 'safe' if risk_status == 'benign' else risk_status
        print(f"[guardrail] potential_risk: {display_status}, risk_type: {result.get('risk_type', 'none')}, hazard: {result.get('hazard', 'none')}")
        sys.stdout.flush()
        
        return result

