"""
Core document QA workflow implementation
"""

import queue
import threading
import time
import logging
from typing import Callable, Dict, Iterator, List, Optional

from langchain.llms.base import BaseLLM

import llm.main as llm_main
import llm.global_config as llm_config
from core.state import DocumentQAState
from core.document_manager import DocumentManager
from CycleIE.agents.workflow_control import WorkflowControl
from utils.llm_utils import get_llm_response

logger = logging.getLogger(__name__)

def stream_document_qa_workflow(query: str, documents: List[str], doc_mode: str = "paths",
                               llm: Optional[BaseLLM] = None, 
                               model: str = "qwen2-72b-instruct", 
                               custom_params: Dict = None,
                               callback: Optional[Callable[[str], None]] = None,
                               task_mode: str = "original") -> Iterator[str]:
    """Execute the document QA workflow using the multi-agent system and stream results.
    
    This function is the streaming version of execute_document_qa_workflow. It yields
    intermediate thoughts and the final answer as they are generated, allowing for
    real-time display of the reasoning process.
    
    Args:
        query: The user query to process
        document: List of document paths to use for answering the query
        doc_mode: str = "paths" or "contents"
        llm: Optional language model instance to use
        model: Model name to use if llm is not provided
        custom_params: Additional parameters for document processing
        callback: Optional callback function to receive thoughts in real-time
        task_mode: str = "original" or "wo_verify" or "wo_extract"
    Returns:
        An iterator that yields thoughts and the final answer as strings
    """
    
    # Set the model in global config if specified
    if model:
        llm_config.set_model(model)
    
    # Create a queue for streaming
    thought_queue = queue.Queue()
    
    def streaming_callback(thought, temporary=False):
        """This callback function puts each thinking step into the queue to be yielded immediately
        
        Args:
            thought: The thought content
            temporary: If True, this is a temporary status message that should be hidden when new messages arrive
        """
        # Put into queue for immediate availability
        thought_queue.put((thought, temporary))  # Store tuple with thought content and temporary flag
        logger.info(f"Added thought to queue: {thought[:50]}... {'(temporary thought)' if temporary else '(regular thought)'}")
        if callback:
            # Pass the temporary flag to the client callback if it supports it
            try:
                # Try with temporary flag
                if temporary:
                    logger.info(f"Calling callback with temporary flag: {thought[:50]}...")
                else:
                    logger.info(f"Calling regular thought callback: {thought[:50]}...")
                    
                callback(thought, temporary=temporary)
            except TypeError:
                # Fall back to original signature if callback doesn't accept the temporary parameter
                logger.warning(f"Callback doesn't support temporary flag parameter, using default callback: {thought[:50]}...")
                callback(thought)
    
    # Create state with streaming capability
    state = DocumentQAState(callback=streaming_callback)
    
    # Return the first items to start the stream
    yield f"Starting analysis for query: {query}\n"
    
    # Handle case with empty document list
    if not documents:
        # Immediately yield thoughts from the queue
        while not thought_queue.empty():
            thought_data = thought_queue.get()
            # Extract thought content from tuple
            if isinstance(thought_data, tuple) and len(thought_data) > 0:
                thought = thought_data[0]
            else:
                thought = thought_data
            yield thought if isinstance(thought, str) else str(thought)
            
        # Directly use LLM to answer without document retrieval
        prompt = f"""Please answer the following question based on your own knowledge. Note that the user has not selected any reference documents, 
        so you should rely on your own knowledge to respond. Also, kindly inform the user that if they wish to receive an answer based on specific documents, 
        they should select the relevant documents and ask the question again.

        Question: {query}
        """
        answer = get_llm_response(prompt, model="qwen2-72b-instruct")
        
        # Ensure all thoughts have been yielded
        while not thought_queue.empty():
            thought_data = thought_queue.get()
            # Extract thought content from tuple
            if isinstance(thought_data, tuple) and len(thought_data) > 0:
                thought = thought_data[0]
            else:
                thought = thought_data
            yield thought if isinstance(thought, str) else str(thought)
        
        # Yield the final answer
        yield "FINAL ANSWER:"
        yield answer
        return
    
    # If documents are selected, process them normally
    # Prioritize using the pre-loaded doc_manager if provided
    yield "Loading and processing documents...\n"

    if doc_mode == "paths":
        if custom_params and "doc_manager" in custom_params:
            doc_manager = custom_params["doc_manager"]
            logger.info("Using pre-loaded DocumentManager")
        else:
            doc_manager = DocumentManager(**(custom_params or {}))
            logger.info("Creating new DocumentManager")
    else:
        doc_manager = DocumentManager(**(custom_params or {}))
        logger.info("Creating new DocumentManager")
    
    # Initialize the thinking agent
    workflow_control = WorkflowControl(state, doc_manager, llm)
    
    # Load and index documents
    if doc_mode == "paths":
        documents_ctx = doc_manager.load_documents(documents)
    elif doc_mode == "contents":
        documents_ctx = documents
    
    # Immediately yield thoughts from the queue
    while not thought_queue.empty():
        thought_data = thought_queue.get()
        # Extract thought content from tuple
        if isinstance(thought_data, tuple) and len(thought_data) > 0:
            thought = thought_data[0]
            is_temporary = thought_data[1] if len(thought_data) > 1 else False
        else:
            thought = thought_data
            is_temporary = False
        
        # Only yield non-temporary thoughts for final output
        if not is_temporary:
            yield thought if isinstance(thought, str) else str(thought)
    
    if not documents_ctx:
        yield "Could not load documents. Please check if the document paths and formats are correct."
        return
    
    # Create or update index - only when not using a pre-loaded doc_manager
    if doc_mode == "paths":
        if not custom_params or "doc_manager" not in custom_params:
            existing_index = doc_manager.load_faiss_index()
            if existing_index:
                doc_manager.add_documents(documents_ctx)
            else:
                doc_manager.index_documents(documents_ctx)
        else:
            doc_manager.add_documents(documents_ctx)
    
    # Immediately yield thoughts from the queue
    while not thought_queue.empty():
        thought_data = thought_queue.get()
        # Extract thought content from tuple
        if isinstance(thought_data, tuple) and len(thought_data) > 0:
            thought = thought_data[0]
            is_temporary = thought_data[1] if len(thought_data) > 1 else False
        else:
            thought = thought_data
            is_temporary = False
        
        # Only yield non-temporary thoughts for final output
        if not is_temporary:
            yield thought if isinstance(thought, str) else str(thought)
    
    # Execute the workflow using the thinking agent - pass document_paths
    try:
        # Begin execution with the thinking agent
        yield "Beginning analysis using ThinkingAgent...\n"
        
        # Special handling for different document modes
        if doc_mode == "contents":
            # If we're using document content directly instead of paths
            result = workflow_control.execute(query, documents=documents_ctx, doc_mode=doc_mode)
        else:
            # Default mode using document paths
            result = workflow_control.execute(query, documents=documents, doc_mode=doc_mode)
        
        # Yield all remaining thoughts
        while not thought_queue.empty():
            thought_data = thought_queue.get()
            # Extract thought content from tuple
            if isinstance(thought_data, tuple) and len(thought_data) > 0:
                thought = thought_data[0]
                is_temporary = thought_data[1] if len(thought_data) > 1 else False
            else:
                thought = thought_data
                is_temporary = False
            
            # Only yield non-temporary thoughts for final output
            if not is_temporary:
                yield thought if isinstance(thought, str) else str(thought)
        
        # Yield the final answer
        yield "\n\nFINAL ANSWER:"
        yield result
        
    except Exception as e:
        logger.error(f"Error during document QA execution: {str(e)}")
        # Yield error message
        yield f"Error during document analysis: {str(e)}"
        # Yield any remaining thoughts in the queue
        while not thought_queue.empty():
            thought_data = thought_queue.get()
            if isinstance(thought_data, tuple) and len(thought_data) > 0:
                thought = thought_data[0]
            else:
                thought = thought_data
            yield thought if isinstance(thought, str) else str(thought)

def execute_document_qa_workflow(query: str, documents: List[str], doc_mode: str = "paths",
                               llm: Optional[BaseLLM] = None, 
                               model: str = "qwen2-72b-instruct", 
                               custom_params: Dict = None,
                               callback: Optional[Callable[[str], None]] = None,
                               task_mode: str = "original") -> Dict:
    """Execute the document QA workflow using the multi-agent system.
    
    This function processes the user query and documents to generate an answer.
    
    Args:
        query: The user query to process
        documents: List of document paths to use for answering the query
        doc_mode: str = "paths" or "contents"
        llm: Optional language model instance to use
        model: Model name to use if llm is not provided
        custom_params: Additional parameters for document processing
        callback: Optional callback function to receive thoughts in real-time
        task_mode: str = "original" or "wo_verify" or "wo_extract"
    Returns:
        Dict containing the answer and thought process
    """
    
    # Set the model in global config if specified
    if model:
        llm_config.set_model(model)
    
    # Create state with callback
    state = DocumentQAState(callback=callback)
    
    # Handle empty document list
    if not documents:
        prompt = f"""Please answer the following question based on your own knowledge. Note that the user has not selected any reference documents, 
        so you should rely on your own knowledge to respond. Also, kindly inform the user that if they wish to receive an answer based on specific documents, 
        they should select the relevant documents and ask the question again.

        Question: {query}
        """
        answer = get_llm_response(prompt, model="qwen2-72b-instruct")
        
        return {
            "answer": answer,
            "thought_process": "No documents provided. Using model's knowledge to answer."
        }
    
    # Initialize document manager
    if doc_mode == "paths":
        if custom_params and "doc_manager" in custom_params:
            doc_manager = custom_params["doc_manager"]
        else:
            doc_manager = DocumentManager(**(custom_params or {}))
    else:
        doc_manager = DocumentManager(**(custom_params or {}))
    
    # Initialize the thinking agent
    workflow_control = WorkflowControl(state, doc_manager, llm)
    
    # Load and index documents
    if doc_mode == "paths":
        documents_ctx = doc_manager.load_documents(documents)
        
        if not documents_ctx:
            return {
                "answer": "Could not load documents. Please check if the document paths and formats are correct.",
                "thought_process": "Error loading documents."
            }
        
        # Create or update index
        if not custom_params or "doc_manager" not in custom_params:
            existing_index = doc_manager.load_faiss_index()
            if existing_index:
                doc_manager.add_documents(documents_ctx)
            else:
                doc_manager.index_documents(documents_ctx)
        else:
            doc_manager.add_documents(documents_ctx)
    
    # Execute the workflow
    try:
        if doc_mode == "contents":
            result = workflow_control.execute(query, documents=documents, doc_mode=doc_mode)
        else:
            result = workflow_control.execute(query, documents=documents, doc_mode=doc_mode)
        
        # Get the thought process
        thought_process = state.get_thought_trail()
        
        return {
            "answer": result,
            "thought_process": thought_process
        }
    except Exception as e:
        logger.error(f"Error during document QA execution: {str(e)}")
        return {
            "answer": f"Error during document analysis: {str(e)}",
            "thought_process": state.get_thought_trail()
        } 