"""Code security utilities for safe execution of LLM-generated code.

This module provides security checks and sandboxing mechanisms to prevent
malicious or dangerous code from being executed.
"""

import re
import signal
from typing import Tuple, Dict, Any, Optional


class SecurityError(Exception):
    """Raised when code fails security validation."""
    pass


class CodeExecutionTimeout(Exception):
    """Raised when code execution exceeds timeout limit."""
    pass


# Forbidden patterns that indicate potentially dangerous code
FORBIDDEN_PATTERNS = [
    (r'__import__\s*\(', 'Direct import of modules'),
    (r'eval\s*\(', 'Use of eval()'),
    (r'exec\s*\(', 'Use of exec()'),
    (r'compile\s*\(', 'Use of compile()'),
    (r'os\.system\s*\(', 'System command execution'),
    (r'subprocess\s*\.', 'Subprocess execution'),
    (r'open\s*\([^)]*[\'"]w', 'File writing operations'),
    (r'__builtins__', 'Access to builtins'),
    (r'globals\s*\(', 'Access to globals()'),
    (r'locals\s*\(', 'Access to locals()'),
    (r'vars\s*\(', 'Access to vars()'),
    (r'dir\s*\(', 'Directory listing'),
    (r'getattr\s*\(', 'Dynamic attribute access'),
    (r'setattr\s*\(', 'Dynamic attribute setting'),
    (r'delattr\s*\(', 'Dynamic attribute deletion'),
    (r'__code__', 'Code object access'),
    (r'__globals__', 'Globals access'),
    (r'import\s+os\b', 'OS module import'),
    (r'import\s+sys\b', 'Sys module import'),
    (r'from\s+os\s+import', 'OS module import'),
    (r'from\s+sys\s+import', 'Sys module import'),
]


def validate_code_safety(code: str, strict: bool = False) -> Tuple[bool, str]:
    """Validate that code doesn't contain dangerous patterns.
    
    Args:
        code: The Python code to validate
        strict: If True, applies stricter validation rules
        
    Returns:
        Tuple of (is_safe, error_message)
        - is_safe: True if code passes validation
        - error_message: Description of security issue if not safe, empty string if safe
    """
    # Check for forbidden patterns
    for pattern, description in FORBIDDEN_PATTERNS:
        if re.search(pattern, code, re.IGNORECASE):
            return False, f"Security violation: {description} (pattern: {pattern})"
    
    # Additional strict checks
    if strict:
        # Check for attempts to access private attributes
        if re.search(r'\._[_\w]+', code):
            return False, "Access to private/protected attributes not allowed"
        
        # Check for suspicious string operations that might be code injection
        if re.search(r'[\'"]\s*\+\s*[a-zA-Z_]|\w+\s*\+\s*[\'"]', code):
            return False, "Suspicious string concatenation that might lead to code injection"
    
    return True, ""


def create_safe_namespace(env_op: Any, additional_allowed: Optional[Dict[str, Any]] = None) -> Dict[str, Any]:
    """Create a restricted namespace for code execution.
    
    Args:
        env_op: The environment operation object (safe to expose)
        additional_allowed: Additional safe functions/objects to include
        
    Returns:
        Dictionary containing only allowed functions and objects
    """
    # Base safe namespace (no builtins by default)
    safe_namespace = {
        '__builtins__': {},  # Empty builtins for security
        'env_op': env_op,
        'print': print,  # Allow printing for debugging
        'len': len,
        'str': str,
        'int': int,
        'float': float,
        'bool': bool,
        'list': list,
        'dict': dict,
        'tuple': tuple,
        'set': set,
        'range': range,
        'enumerate': enumerate,
        'zip': zip,
        'min': min,
        'max': max,
        'sum': sum,
        'abs': abs,
        'round': round,
        'True': True,
        'False': False,
        'None': None,
    }
    
    # Add additional allowed items
    if additional_allowed:
        safe_namespace.update(additional_allowed)
    
    return safe_namespace


class TimeoutHandler:
    """Context manager for executing code with timeout protection."""
    
    def __init__(self, timeout_seconds: int = 30):
        """Initialize timeout handler.
        
        Args:
            timeout_seconds: Maximum execution time in seconds
        """
        self.timeout_seconds = timeout_seconds
        self.old_handler = None
    
    def _timeout_handler(self, signum, frame):
        """Signal handler for timeout."""
        raise CodeExecutionTimeout(
            f"Code execution exceeded timeout limit of {self.timeout_seconds} seconds"
        )
    
    def __enter__(self):
        """Set up timeout handler."""
        self.old_handler = signal.signal(signal.SIGALRM, self._timeout_handler)
        signal.alarm(self.timeout_seconds)
        return self
    
    def __exit__(self, exc_type, exc_val, exc_tb):
        """Clean up timeout handler."""
        signal.alarm(0)  # Cancel alarm
        if self.old_handler is not None:
            signal.signal(signal.SIGALRM, self.old_handler)
        return False  # Don't suppress exceptions


def execute_code_safely(
    code: str,
    env_op: Any,
    vars: Optional[Dict[str, Any]] = None,
    timeout: int = 30,
    strict_validation: bool = False
) -> Dict[str, Any]:
    """Execute code in a safe sandboxed environment.
    
    Args:
        code: Python code to execute
        env_op: Environment operation object
        vars: Additional variables to pass to the code
        timeout: Maximum execution time in seconds
        strict_validation: Apply strict security validation
        
    Returns:
        The safe namespace after execution (containing any results)
        
    Raises:
        SecurityError: If code fails security validation
        CodeExecutionTimeout: If execution exceeds timeout
        SyntaxError: If code has syntax errors
    """
    # Step 1: Validate code safety
    is_safe, error_msg = validate_code_safety(code, strict=strict_validation)
    if not is_safe:
        raise SecurityError(error_msg)
    
    # Step 2: Create safe namespace
    safe_namespace = create_safe_namespace(env_op, vars)
    
    # Step 3: Execute with timeout protection
    with TimeoutHandler(timeout):
        try:
            exec(code, safe_namespace)
        except CodeExecutionTimeout:
            raise
        except Exception as e:
            # Preserve original exception with context
            raise type(e)(f"Error during code execution: {e}").with_traceback(e.__traceback__)
    
    return safe_namespace


def sanitize_code_for_logging(code: str, max_length: int = 500) -> str:
    """Sanitize code for safe logging (prevent log injection).
    
    Args:
        code: Code to sanitize
        max_length: Maximum length of sanitized code
        
    Returns:
        Sanitized code string safe for logging
    """
    # Remove potential log injection characters
    sanitized = re.sub(r'[\x00-\x1f\x7f-\x9f]', '', code)
    
    # Truncate if too long
    if len(sanitized) > max_length:
        sanitized = sanitized[:max_length] + '... (truncated)'
    
    return sanitized

