from pathlib import Path
from logging import Logger
import re
import subprocess
import json
from typing import List, Optional, Tuple

def cloneRepo(repoPath: Path, repoUrl: str, logger: Logger) -> None:
    """Clone the repository into repoPath if it does not exist."""
    # Initialize repository
    if not repoPath.exists():
        logger.info(f"Cloning {repoUrl} to {repoPath}...")
        result = subprocess.run(["git", "clone", repoUrl, 
                    str(repoPath)], capture_output=True, text=True)
        if result.returncode != 0:
            logger.error(f"Failed to clone repository: {result.stderr}")
            raise RuntimeError("Failed to clone repository")
    else:
        logger.info(f"Using existing repository at {repoPath}")
    
    logger.info(f"MegaCoder initialized with repo at {repoPath}")

def checkoutCommit(repoPath: Path, commitId: str, backportCommitsJsonPath: Optional[Path], logger: Logger) -> bool:
    """Checkout a specific commit in an already-cloned repo and apply backports (if backportCommitsJsonPath is specified)."""
#    return True
    logger.info(f"Checking out commit {commitId} in repo {repoPath}")
    result = subprocess.run(["git", "checkout", "-f", commitId], cwd=repoPath, capture_output=True)
    
    if result.returncode != 0:
        logger.info(f"Commit {commitId} not found locally, trying to fetch...")
        # Try to fetch the specific commit
        fetchResult = subprocess.run(["git", "fetch", 'origin', f'{commitId}:refs/remotes/origin/orphaned-commit'], 
                        cwd=repoPath, capture_output=True)
        
        if fetchResult.returncode != 0:
            logger.error(f"Failed to fetch commit as if it's a dangling commit: {fetchResult.stderr.decode()}")
            return False
        
        checkoutResult = subprocess.run(["git", "checkout", "-f", commitId], cwd=repoPath, capture_output=True)
        if checkoutResult.returncode != 0:
            logger.error(f"Failed to checkout after fetch: {checkoutResult.stderr.decode()}")
            return False
    
    if backportCommitsJsonPath:
        return applyFixBackports(repoPath, backportCommitsJsonPath, logger)
    return True

def canonicalizeCommitTitle(title: str) -> str:
    """Canonicalize commit title by removing prefixes."""
    commitPrefixes = [
        'UPSTREAM:', 'CHROMIUM:', 'FROMLIST:', 
        'BACKPORT:', 'FROMGIT:', 'net-backports:'
    ]
    for prefix in commitPrefixes:
        if title.find(prefix) == 0:
            return (title[len(prefix):]).strip()
    return title.strip()

def getCommitIdByMessage(repoPath: Path, message: str, logger: Logger) -> Optional[str]:
    """Find commit ID by message content."""
    logger.debug(f"Searching for commit with message: {message}")
    result = subprocess.run(["git", "log", "-F", "--grep", message], 
                cwd=repoPath, capture_output=True, text=True)
    
    if result.returncode == 0 and result.stdout:
        commit_id = result.stdout.split('\n', maxsplit=1)[0].split(' ')[1]
        logger.debug(f"Found commit: {commit_id}")
        return commit_id
    
    logger.debug("No matching commit found")
    return None

def checkAncestorByCommitId(repoPath: Path, ancestorCommitId: str, logger: Logger) -> bool:
    """Check if a commit is an ancestor of HEAD."""
    logger.debug(f"Checking if {ancestorCommitId} is ancestor of HEAD")
    result = subprocess.run(["git", "merge-base", "--is-ancestor", ancestorCommitId, "HEAD"],
                cwd=repoPath, capture_output=True)
    return result.returncode == 0

def applyFixBackports(repoPath: Path, backportsJson: Path, logger: Logger) -> bool:
    """Apply fix backports from JSON file."""
    logger.info("Applying fix backports...")
    try:
        with open(backportsJson, 'r', encoding='utf-8') as fp:
            commits = json.load(fp)
        
        for commit in commits:
            if 'guilty_hash' in commit:
                if not checkAncestorByCommitId(repoPath, commit['guilty_hash'], logger):
                    logger.debug(f"Skipping commit {commit['guilty_hash']} - not an ancestor")
                    continue
                    
            fixCommit = getCommitIdByMessage(
                repoPath, canonicalizeCommitTitle(commit['fix_title']), logger)
            
            if isinstance(fixCommit, str):
                logger.debug(f"Fix already applied: {fixCommit}")
                continue
                
            cherryPickCmd = ['git', 'cherry-pick', '--no-commit']
            cherryPickCmd.extend(['--strategy-option'])
            
            if commit.get('force_merge', False):
                cherryPickCmd.append('theirs')
            else:
                cherryPickCmd.append('ours')
                
            if 'mainline' in commit:
                assert commit['mainline'] > 0
                cherryPickCmd.extend(['-m', str(commit['mainline'])])
                
            cherryPickCmd.append(commit['fix_hash'])
            
            logger.info(f"Applying fix: {commit['fix_hash']}")
            result = subprocess.run(cherryPickCmd, cwd=repoPath, capture_output=True)
            if result.returncode != 0:
                logger.error(f"Failed to apply fix: {result.stderr.decode()}")
                return False
        
        logger.info("Successfully applied all fix backports")
        return True
        
    except Exception as e:
        logger.error(f"Error applying fix backports: {e}")
        return False

def extractRelevantLines(crashReport: str) -> List[Tuple[str, str, Optional[str]]]:
    """
    Extract source code lines mentioned in a kernel crash report.
    Args:
        crashReport: The crash report text to analyze
    Returns:
        List of tuples containing (filePath, functionName, lineNumber)
        where line_number may be None if not present in the trace
    """
    regex = r"(\w+)(?:\+0x[0-9a-f]+/0x[0-9a-f]+)?\s+([a-zA-Z0-9/_.-]+\.(?:c|h|S))(?::(\d+))?\s*(?:\[inline\])?"
    matches = re.finditer(regex, crashReport)
    uniqueMatches = set((m.group(2), m.group(1), m.group(3)) for m in matches)
    return list(uniqueMatches)