"""
Queue Management System for Mathematical Model Evaluation

This module implements the global evaluation queue with enhanced prioritization,
global concurrency limits, and per-company limits.

Key Features:
- Global limit of 4 concurrent evaluations
- Per-company limit of 2 concurrent evaluations
- Priority order: Tier 1 attempt 1 > Tier 2 > Tier 3 > Tier 4 > Tier 1 attempt 2
- Improved cancellation handling with subprocess tracking
"""

import logging
import threading
from datetime import datetime, timedelta
from typing import Dict, List, Optional, Tuple, Any
from contextlib import contextmanager
from django.db import transaction, connection
from django.utils import timezone
from django.conf import settings
from asgiref.sync import sync_to_async

from .models import (
    EvaluationQueue, Model, Question, ModelTier, Company,
    ModelAttempt, CompanyExecutionLock, ExecutionTracker
)

logger = logging.getLogger(__name__)

# Global configuration
MAX_GLOBAL_CONCURRENT = 4  # Maximum total concurrent evaluations
MAX_COMPANY_CONCURRENT = 2  # Maximum concurrent evaluations per company


class QueueManager:
    """
    Manages the global evaluation queue with enhanced prioritization and limits.
    
    Key Features:
    - Custom priority ordering (Tier 1 attempt 1 > Tier 2 > Tier 3 > Tier 4 > Tier 1 attempt 2)
    - Global concurrency limit (4 evaluations max)
    - Per-company concurrency limit (2 evaluations max per company)
    - Automatic second attempt scheduling for Tier 1 models
    - Subprocess tracking for better cancellation handling
    """
    
    def __init__(self):
        """Initialize the queue manager."""
        self._lock = threading.RLock()  # Thread-safe operations
        logger.info("Queue manager initialized with global limit=%d, company limit=%d", 
                   MAX_GLOBAL_CONCURRENT, MAX_COMPANY_CONCURRENT)
    
    def add_to_queue(self, model: Model, question: Question) -> EvaluationQueue:
        """
        Add an evaluation to the queue using attempt-based architecture.
        
        Creates a model_attempt record first, then queues it for evaluation.
        For Tier 1 models, automatically creates and queues a second attempt.
        
        Args:
            model: Model to evaluate
            question: Question to evaluate
            
        Returns:
            Created EvaluationQueue object for the first attempt
        """
        with self._lock:
            try:
                with transaction.atomic():
                    # Check if attempt already exists and is queued/running
                    existing_attempt = ModelAttempt.objects.filter(
                        model=model,
                        question=question,
                        attempt_number=1
                    ).first()
                    
                    if existing_attempt:
                        existing_queue = EvaluationQueue.objects.filter(
                            attempt=existing_attempt
                        ).exclude(status='failed').first()
                        
                        if existing_queue:
                            logger.warning(f"Evaluation already exists: {existing_queue.id}")
                            return existing_queue
                    
                    # Create first attempt record
                    first_attempt = ModelAttempt.objects.create(
                        model=model,
                        question=question,
                        attempt_number=1,
                        time=timezone.now()
                    )
                    
                    # Queue the first attempt for evaluation
                    queue_item = EvaluationQueue.objects.create(
                        attempt=first_attempt,
                        status='pending',
                        submitted_at=timezone.now(),
                    )
                    
                    logger.info(f"Added to queue: Q{question.id} with {model.model_name} "
                              f"(tier {model.tier.tier_number}, attempt 1, queue ID {queue_item.id})")
                    
                    # For Tier 1 models, automatically create and queue second attempt
                    if model.tier.tier_number == 1:
                        second_attempt = ModelAttempt.objects.create(
                            model=model,
                            question=question,
                            attempt_number=2,
                            time=timezone.now()
                        )
                        
                        second_queue_item = EvaluationQueue.objects.create(
                            attempt=second_attempt,
                            status='pending',
                            submitted_at=timezone.now(),
                        )
                        
                        logger.info(f"Scheduled second attempt: Q{question.id} with {model.model_name} "
                                  f"(will run after Tier 4, queue ID {second_queue_item.id})")
                    
                    return queue_item
                    
            except Exception as e:
                logger.error(f"Error adding to queue: {str(e)}")
                raise
    
    def _get_effective_priority(self, queue_item: EvaluationQueue) -> int:
        """
        Calculate effective priority for queue ordering.
        
        Priority order:
        1. Tier 1, attempt 1
        2. Tier 2 (all attempts)
        3. Tier 3 (all attempts)  
        4. Tier 4 (all attempts)
        5. Tier 1, attempt 2
        
        Args:
            queue_item: Queue item to calculate priority for
            
        Returns:
            Priority value (lower = higher priority)
        """
        tier_number = queue_item.attempt.model.tier.tier_number
        attempt_number = queue_item.attempt.attempt_number
        
        # Special handling for Tier 1 second attempts
        if tier_number == 1 and attempt_number == 2:
            return 5  # Lowest priority
        
        # All other cases use tier number as priority
        return tier_number
    
    async def get_next_evaluation(self) -> Optional[EvaluationQueue]:
        """
        Get the next evaluation from the queue respecting all limits and priorities.
        
        Enforces:
        - Global limit of 4 concurrent evaluations
        - Per-company limit of 2 concurrent evaluations
        - Custom priority ordering
        
        Returns:
            Next queue item to process or None if no available work
        """
        with self._lock:
            try:
                logger.info("Getting next evaluation...")
                
                @sync_to_async
                def get_next_atomic():
                    with transaction.atomic():
                        # Check global limit
                        running_count = ExecutionTracker.objects.count()
                        if running_count >= MAX_GLOBAL_CONCURRENT:
                            logger.info(f"Global limit reached: {running_count}/{MAX_GLOBAL_CONCURRENT} running")
                            return None, {}
                        
                        # Get per-company running counts
                        company_counts = {}
                        for tracker in ExecutionTracker.objects.select_related('company').all():
                            company_id = tracker.company_id
                            company_counts[company_id] = company_counts.get(company_id, 0) + 1
                        
                        logger.info(f"Current running: {running_count} total, by company: {company_counts}")
                        
                        # Find companies that haven't reached their limit
                        available_companies = []
                        all_companies = Company.objects.all()
                        for company in all_companies:
                            current_count = company_counts.get(company.id, 0)
                            if current_count < MAX_COMPANY_CONCURRENT:
                                available_companies.append(company.id)
                        
                        if not available_companies:
                            logger.info("All companies at their limit")
                            return None, company_counts
                        
                        logger.info(f"Companies with capacity: {available_companies}")
                        
                        # Get all pending evaluations from available companies
                        pending_evaluations = EvaluationQueue.objects.select_for_update().select_related(
                            'attempt__model__tier',
                            'attempt__model__company',
                            'attempt__question'
                        ).filter(
                            status='pending',
                            attempt__model__company_id__in=available_companies
                        )
                        
                        # Sort by our custom priority, then by submission time
                        pending_list = list(pending_evaluations)
                        pending_list.sort(key=lambda x: (
                            self._get_effective_priority(x),
                            x.submitted_at
                        ))
                        
                        if pending_list:
                            next_evaluation = pending_list[0]
                            logger.info(f"Selected: Queue {next_evaluation.id}, "
                                      f"Tier {next_evaluation.attempt.model.tier.tier_number}, "
                                      f"Attempt {next_evaluation.attempt.attempt_number}, "
                                      f"Priority {self._get_effective_priority(next_evaluation)}")
                            return next_evaluation, company_counts
                        
                        logger.info("No pending evaluations for available companies")
                        return None, company_counts
                
                next_evaluation, company_counts = await get_next_atomic()
                
                if next_evaluation:
                    # Create execution tracker entry
                    success = await self._create_execution_tracker(next_evaluation)
                    if success:
                        # Mark as running
                        next_evaluation.status = 'running'
                        next_evaluation.started_at = timezone.now()
                        await sync_to_async(next_evaluation.save)(update_fields=['status', 'started_at'])
                        
                        logger.info(f"Assigned evaluation: Q{next_evaluation.attempt.question.id} "
                                  f"with {next_evaluation.attempt.model.model_name} "
                                  f"(attempt {next_evaluation.attempt.attempt_number}, "
                                  f"tier {next_evaluation.attempt.model.tier.tier_number}, "
                                  f"queue ID {next_evaluation.id})")
                        
                        return next_evaluation
                    else:
                        logger.error(f"Failed to create execution tracker for queue {next_evaluation.id}")
                        return None
                
                return None
                    
            except Exception as e:
                logger.error(f"Error getting next evaluation: {str(e)}")
                return None
    
    async def _create_execution_tracker(self, queue_item: EvaluationQueue) -> bool:
        """
        Create an execution tracker entry for the evaluation.
        
        Args:
            queue_item: Queue item to track
            
        Returns:
            True if tracker created successfully
        """
        try:
            await sync_to_async(ExecutionTracker.objects.create)(
                queue=queue_item,
                company=queue_item.attempt.model.company,
                model=queue_item.attempt.model,
                question=queue_item.attempt.question,
                attempt_number=queue_item.attempt.attempt_number,
                subprocess_pid=None,  # Will be updated when subprocess starts
                started_at=timezone.now()
            )
            logger.debug(f"Created execution tracker for queue {queue_item.id}")
            return True
        except Exception as e:
            logger.error(f"Error creating execution tracker: {str(e)}")
            return False
    
    async def update_subprocess_pid(self, queue_item: EvaluationQueue, pid: int) -> bool:
        """
        Update the subprocess PID in the execution tracker.
        
        Args:
            queue_item: Queue item being executed
            pid: Process ID of the subprocess
            
        Returns:
            True if updated successfully
        """
        try:
            @sync_to_async
            def update_pid():
                tracker = ExecutionTracker.objects.filter(queue=queue_item).first()
                if tracker:
                    tracker.subprocess_pid = pid
                    tracker.save(update_fields=['subprocess_pid'])
                    return True
                return False
            
            success = await update_pid()
            if success:
                logger.debug(f"Updated PID {pid} for queue {queue_item.id}")
            else:
                logger.warning(f"No tracker found for queue {queue_item.id}")
            return success
        except Exception as e:
            logger.error(f"Error updating subprocess PID: {str(e)}")
            return False
    
    async def release_execution_tracker(self, queue_item: EvaluationQueue) -> bool:
        """
        Release the execution tracker for a completed/failed evaluation.
        
        Args:
            queue_item: Queue item to release
            
        Returns:
            True if released successfully
        """
        with self._lock:
            try:
                @sync_to_async
                def release_tracker():
                    with transaction.atomic():
                        deleted_count = ExecutionTracker.objects.filter(queue=queue_item).delete()[0]
                        return deleted_count
                
                deleted_count = await release_tracker()
                
                if deleted_count > 0:
                    logger.info(f"Released execution tracker for queue {queue_item.id}")
                    return True
                else:
                    logger.debug(f"No tracker found to release for queue {queue_item.id}")
                    return False
                    
            except Exception as e:
                logger.error(f"Error releasing execution tracker: {str(e)}")
                return False
    
    async def complete_evaluation(
        self,
        queue_item: EvaluationQueue,
        success: bool,
        error_message: Optional[str] = None
    ) -> bool:
        """
        Mark evaluation as completed and release execution tracker.
        
        Args:
            queue_item: Queue item to complete
            success: Whether evaluation succeeded
            error_message: Error message if failed
            
        Returns:
            True if completed successfully
        """
        with self._lock:
            try:
                @sync_to_async
                def complete_atomic():
                    with transaction.atomic():
                        # Update queue item status
                        queue_item.status = 'completed' if success else 'failed'
                        queue_item.completed_at = timezone.now()
                        
                        if not success:
                            queue_item.error_message = error_message
                        
                        queue_item.save()
                
                await complete_atomic()
                
                # Release execution tracker
                await self.release_execution_tracker(queue_item)
                
                logger.info(f"Completed evaluation: attempt {queue_item.attempt.id}, "
                          f"queue ID {queue_item.id}, success: {success}")
                
                return True
                    
            except Exception as e:
                logger.error(f"Error completing evaluation: {str(e)}")
                return False
    
    async def handle_cancellation(self, queue_id: int) -> bool:
        """
        Handle cancellation of a running evaluation.
        
        This includes:
        - Marking the queue item as cancelled
        - Terminating the subprocess if running
        - Releasing the execution tracker
        
        Args:
            queue_id: ID of the queue item to cancel
            
        Returns:
            True if cancelled successfully
        """
        try:
            import os
            import signal
            
            @sync_to_async
            def cancel_atomic():
                with transaction.atomic():
                    # Get the queue item
                    queue_item = EvaluationQueue.objects.filter(id=queue_id).first()
                    if not queue_item:
                        logger.warning(f"Queue item {queue_id} not found")
                        return None, None
                    
                    # Get the execution tracker
                    tracker = ExecutionTracker.objects.filter(queue_id=queue_id).first()
                    
                    # Update queue status
                    queue_item.status = 'cancelled'
                    queue_item.completed_at = timezone.now()
                    queue_item.error_message = 'Cancelled by user'
                    queue_item.save()
                    
                    return queue_item, tracker
            
            queue_item, tracker = await cancel_atomic()
            
            if not queue_item:
                return False
            
            # Terminate subprocess if it exists
            if tracker and tracker.subprocess_pid:
                try:
                    logger.info(f"Terminating subprocess {tracker.subprocess_pid} for queue {queue_id}")
                    os.kill(tracker.subprocess_pid, signal.SIGTERM)
                    # Give it time to terminate gracefully
                    await asyncio.sleep(2)
                    # Force kill if still running
                    try:
                        os.kill(tracker.subprocess_pid, signal.SIGKILL)
                    except ProcessLookupError:
                        pass  # Process already terminated
                except ProcessLookupError:
                    logger.info(f"Subprocess {tracker.subprocess_pid} already terminated")
                except Exception as e:
                    logger.error(f"Error terminating subprocess: {str(e)}")
            
            # Release the execution tracker
            if tracker:
                await self.release_execution_tracker(queue_item)
            
            logger.info(f"Successfully cancelled evaluation queue {queue_id}")
            return True
            
        except Exception as e:
            logger.error(f"Error handling cancellation for queue {queue_id}: {str(e)}")
            return False
    
    def get_queue_status(self) -> Dict[str, Any]:
        """
        Get comprehensive queue status information.
        
        Returns:
            Dictionary with queue statistics
        """
        try:
            status = {
                'pending': EvaluationQueue.objects.filter(status='pending').count(),
                'running': EvaluationQueue.objects.filter(status='running').count(),
                'completed': EvaluationQueue.objects.filter(status='completed').count(),
                'failed': EvaluationQueue.objects.filter(status='failed').count(),
                'cancelled': EvaluationQueue.objects.filter(status='cancelled').count(),
            }
            
            # Add running evaluation details
            status['running_details'] = []
            for tracker in ExecutionTracker.objects.select_related(
                'company', 'model', 'question', 'queue'
            ).all():
                status['running_details'].append({
                    'queue_id': tracker.queue_id,
                    'company': tracker.company.company_name,
                    'model': tracker.model.model_name,
                    'question_id': tracker.question_id,
                    'attempt': tracker.attempt_number,
                    'pid': tracker.subprocess_pid,
                    'started_at': tracker.started_at.isoformat() if tracker.started_at else None,
                })
            
            # Add per-company counts
            status['company_counts'] = {}
            for tracker in ExecutionTracker.objects.select_related('company').all():
                company_name = tracker.company.company_name
                status['company_counts'][company_name] = status['company_counts'].get(company_name, 0) + 1
            
            # Add limits
            status['limits'] = {
                'global_max': MAX_GLOBAL_CONCURRENT,
                'global_current': len(status['running_details']),
                'company_max': MAX_COMPANY_CONCURRENT,
            }
            
            # Add tier breakdown with custom priority
            status['pending_by_priority'] = {}
            pending_items = EvaluationQueue.objects.filter(
                status='pending'
            ).select_related('attempt__model__tier')
            
            for item in pending_items:
                priority = self._get_effective_priority(item)
                tier = item.attempt.model.tier.tier_number
                attempt = item.attempt.attempt_number
                
                if tier == 1 and attempt == 2:
                    key = 'tier_1_attempt_2'
                else:
                    key = f'tier_{tier}'
                
                if key not in status['pending_by_priority']:
                    status['pending_by_priority'][key] = {
                        'count': 0,
                        'priority': priority
                    }
                status['pending_by_priority'][key]['count'] += 1
            
            return status
            
        except Exception as e:
            logger.error(f"Error getting queue status: {str(e)}")
            return {'error': str(e)}
    
    def cleanup_stale_trackers(self, max_age_hours: int = 3) -> int:
        """
        Clean up stale execution trackers (older than max_age_hours).
        
        This handles cases where evaluations were cancelled or crashed
        without proper cleanup.
        
        Args:
            max_age_hours: Maximum age for trackers in hours
            
        Returns:
            Number of trackers cleaned up
        """
        with self._lock:
            try:
                cutoff_time = timezone.now() - timedelta(hours=max_age_hours)
                
                # Find stale trackers
                stale_trackers = ExecutionTracker.objects.filter(
                    started_at__lt=cutoff_time
                ).select_related('company', 'queue')
                
                count = 0
                for tracker in stale_trackers:
                    logger.warning(f"Cleaning up stale tracker for queue {tracker.queue_id} "
                                 f"({tracker.company.company_name}, started {tracker.started_at})")
                    
                    # Update queue status if it's still running
                    if tracker.queue and tracker.queue.status == 'running':
                        tracker.queue.status = 'failed'
                        tracker.queue.error_message = 'Evaluation timed out (stale tracker cleanup)'
                        tracker.queue.completed_at = timezone.now()
                        tracker.queue.save()
                    
                    count += 1
                
                # Delete all stale trackers
                if count > 0:
                    ExecutionTracker.objects.filter(
                        started_at__lt=cutoff_time
                    ).delete()
                
                # Also clean up old company locks if they still exist
                try:
                    old_locks = CompanyExecutionLock.objects.filter(
                        locked_at__lt=cutoff_time
                    ).delete()[0]
                    if old_locks > 0:
                        logger.info(f"Cleaned up {old_locks} old company locks")
                except:
                    pass  # Table might not exist anymore
                
                return count
                
            except Exception as e:
                logger.error(f"Error cleaning up stale trackers: {str(e)}")
                return 0
    
    def bulk_add_evaluations(
        self,
        model_question_pairs: List[Tuple[Model, Question]]
    ) -> List[EvaluationQueue]:
        """
        Add multiple evaluations to the queue efficiently.
        
        Args:
            model_question_pairs: List of (model, question) tuples
            
        Returns:
            List of created queue items
        """
        with self._lock:
            created_items = []
            
            try:
                with transaction.atomic():
                    for model, question in model_question_pairs:
                        try:
                            queue_item = self.add_to_queue(model, question)
                            created_items.append(queue_item)
                        except Exception as e:
                            logger.error(f"Error adding {model.model_name} x Q{question.id}: {str(e)}")
                
                logger.info(f"Bulk added {len(created_items)} evaluations to queue")
                return created_items
                
            except Exception as e:
                logger.error(f"Error in bulk add: {str(e)}")
                return created_items


# Global queue manager instance
queue_manager = QueueManager()


# Context manager for safe queue operations
@contextmanager
def queue_transaction():
    """Context manager for safe queue operations with automatic cleanup."""
    try:
        yield queue_manager
    except Exception as e:
        logger.error(f"Queue operation failed: {str(e)}")
        raise
    finally:
        # Cleanup any stale trackers on errors
        queue_manager.cleanup_stale_trackers(max_age_hours=1)


# Convenience functions
def add_evaluation(model: Model, question: Question, **kwargs) -> EvaluationQueue:
    """Add a single evaluation to the queue."""
    return queue_manager.add_to_queue(model, question, **kwargs)


async def get_next_work() -> Optional[EvaluationQueue]:
    """Get the next evaluation to process."""
    return await queue_manager.get_next_evaluation()


async def complete_work(queue_item: EvaluationQueue, success: bool, error: str = None) -> bool:
    """Complete an evaluation."""
    return await queue_manager.complete_evaluation(queue_item, success, error)


async def cancel_evaluation(queue_id: int) -> bool:
    """Cancel a running evaluation."""
    return await queue_manager.handle_cancellation(queue_id)


def get_queue_stats() -> Dict[str, Any]:
    """Get queue statistics."""
    return queue_manager.get_queue_status()