import re
from typing import Optional, Tuple

# Sanitizer error message patterns
SANITIZER_ERROR_PATTERNS = [
    "ERROR: AddressSanitizer:",
    "ERROR: MemorySanitizer:",
    "WARNING: MemorySanitizer:",
    "UndefinedBehaviorSanitizer:DEADLYSIGNAL",
    "ERROR: LeakSanitizer:",
    "SUMMARY: UndefinedBehaviorSanitizer: undefined-behavior",
]

# Sanitizer report patterns
SANITIZER_START_PATTERN = r"==\d+==(?:ERROR|WARNING): (\w+)Sanitizer:"
SANITIZER_END_PATTERN = r"==\d+==ABORTING"
# Stack trace pattern that often appears at the end of sanitizer reports
STACK_TRACE_END_PATTERN = r"\s+#\d+ 0x[0-9a-f]+"

# Additional sanitizer error indicators for fallback detection
SANITIZER_INDICATORS = [
    "AddressSanitizer",
    "LeakSanitizer",
    "UndefinedBehaviorSanitizer",
    "ThreadSanitizer",
    "MemorySanitizer",
]


def extract_sanitizer_report(container_output: str) -> Optional[str]:
    """Extract the sanitizer report from container output using regex.

    Args:
        container_output: Container log output

    Returns:
        Extracted sanitizer report or None if no report found
    """
    # Look for complete sanitizer report with both start and end patterns
    start_match = re.search(SANITIZER_START_PATTERN, container_output)
    end_match = re.search(SANITIZER_END_PATTERN, container_output)

    if start_match and end_match:
        # Get the start and end positions of the report
        start_pos = start_match.start()
        end_pos = end_match.end()

        # Make sure end_pos comes after start_pos
        if end_pos > start_pos:
            # Extract the complete report
            return container_output[start_pos:end_pos]

    # If we have a start match but no end match, try to find the last stack trace line
    if start_match and not end_match:
        start_pos = start_match.start()
        # Find all stack trace lines
        stack_trace_matches = list(
            re.finditer(STACK_TRACE_END_PATTERN, container_output[start_pos:])
        )
        if stack_trace_matches:
            # Use the last stack trace line as the end point (plus some buffer)
            last_match = stack_trace_matches[-1]
            end_pos = (
                # Find the position after the last stack trace match
                start_pos + last_match.end()
            )
            # Find the next newline after the last stack trace match
            next_newline_pos = container_output.find("\n", end_pos)
            if next_newline_pos != -1:
                end_pos = next_newline_pos + 1  # Include the newline
            end_pos = min(end_pos, len(container_output))
            return container_output[start_pos:end_pos]

    # If we can't find a complete report, check if any sanitizer indicators exist
    if any(indicator in container_output for indicator in SANITIZER_ERROR_PATTERNS):
        # Extract context around the first indicator found
        for indicator in SANITIZER_ERROR_PATTERNS:
            if indicator in container_output:
                idx = container_output.find(indicator)
                # Get up to 1000 characters before and after the indicator
                start_idx = max(0, idx - 1000)
                end_idx = min(len(container_output), idx + 1000)
                return container_output[start_idx:end_idx]

    return None


def check_sanitizer_errors(container_output: str) -> Tuple[bool, Optional[str]]:
    """Check if container output contains sanitizer errors and extract the report.

    Args:
        container_output: Container log output

    Returns:
        Tuple of (has_errors, error_report) where:
        - has_errors: True if sanitizer errors found, False otherwise
        - error_report: The extracted sanitizer report or None if no report found
    """
    sanitizer_report = extract_sanitizer_report(container_output)

    if sanitizer_report:
        # If we have a report, return it with True for has_errors
        return True, sanitizer_report

    # Fallback check for any sanitizer indicator
    # has_errors = any(
    #     indicator in container_output for indicator in SANITIZER_INDICATORS
    # )
    # return has_errors, container_output if has_errors else None
    return False, None
