#!/usr/bin/env python3
"""
Question Answering Module with Topological Graph Integration

This module provides question answering capabilities using the 32B model with two modes:
1. Standard QA: Question only
2. Enhanced QA: Question + Topological Graph for structured reasoning
"""

import os
import json
import asyncio
import aiohttp
import time
import pandas as pd
import networkx as nx
from typing import List, Dict, Any, Tuple, Optional
from dotenv import load_dotenv
from .context_retrievers import (
    BaseContextRetriever, 
    DataRetrievalContextRetriever, 
    TopologicalGraphContextRetriever,
    NoContextRetriever
)
load_dotenv()

VLLM_TEXT_URL = os.getenv("VLLM_QWEN_32B_URL")
DEFAULT_TEXT_MODEL = os.getenv("VLLM_QWEN_32B_MODEL")

class QuestionAnswerer:
    """Question answering with modular context retrieval strategies"""
    
    def __init__(self, model_config: Dict[str, Any] = None, 
                 context_retriever: BaseContextRetriever = None):
        self.model_config = model_config or {
            'base_url': VLLM_TEXT_URL,
            'model_name': DEFAULT_TEXT_MODEL,
            'max_tokens': 2048,
            'temperature': 0.7
        }
        self.session = None
        self.context_retriever = context_retriever or NoContextRetriever()
    
    async def __aenter__(self):
        self.session = aiohttp.ClientSession()
        return self
    
    async def __aexit__(self, exc_type, exc_val, exc_tb):
        if self.session:
            await self.session.close()
    
    def load_topological_graph(self, graph_dir: str) -> Tuple[List[str], Dict[int, List[str]], Dict[str, int]]:
        """Load topological graph data"""
        print("📊 Loading topological graph...")
        
        # Load hierarchy
        hierarchy_path = os.path.join(graph_dir, "hierarchy.parquet")
        if not os.path.exists(hierarchy_path):
            print("❌ Hierarchy file not found")
            return [], {}, {}
        
        hierarchy_df = pd.read_parquet(hierarchy_path)
        hierarchy = {}
        for _, row in hierarchy_df.iterrows():
            level = row['level']
            node = row['node']
            if level not in hierarchy:
                hierarchy[level] = []
            hierarchy[level].append(node)
        
        # Load node mapping
        mapping_path = os.path.join(graph_dir, "node_mapping.parquet")
        node_mapping = {}
        if os.path.exists(mapping_path):
            mapping_df = pd.read_parquet(mapping_path)
            for _, row in mapping_df.iterrows():
                node_mapping[row['original_node']] = row['representative_node']
        
        # Load sorted nodes
        sorted_path = os.path.join(graph_dir, "topological_sort.parquet")
        sorted_nodes = []
        if os.path.exists(sorted_path):
            sorted_df = pd.read_parquet(sorted_path)
            sorted_nodes = sorted_df['node'].tolist()
        
        print(f"   Loaded hierarchy with {len(hierarchy)} levels")
        print(f"   Loaded {len(sorted_nodes)} sorted nodes")
        print(f"   Loaded {len(node_mapping)} node mappings")
        
        return sorted_nodes, hierarchy, node_mapping
    
    def create_standard_prompt(self, question: str, use_thinking: bool = False) -> str:
        """Create simplified standard question answering prompt"""
        if use_thinking:
            thinking_instruction = """
<think>
[Your step-by-step reasoning here]
</think>

"""
            return f"""Question: {question}{thinking_instruction}

Answer:"""
        else:
            # Add </think></think> to block thinking mode
            return f"""Question: {question}

</think></think>

Answer:"""
    
    def create_context_prompt(self, question: str, context: Dict[str, Any], use_thinking: bool = False, simple_prompt: bool = False) -> str:
        """Create prompt with retrieved context"""
        method = context.get('method', 'unknown')
        
        if method == 'data_retrieval':
            if simple_prompt:
                return self._create_simple_data_retrieval_prompt(question, context, use_thinking)
            else:
                return self._create_data_retrieval_prompt(question, context, use_thinking)
        elif method == 'topological_graph':
            return self._create_topological_graph_prompt(question, context, use_thinking)
        elif method == 'hybrid':
            return self._create_hybrid_prompt(question, context, use_thinking)
        else:
            # Fallback to standard prompt
            return self.create_standard_prompt(question, use_thinking)
    
    def _create_data_retrieval_prompt(self, question: str, context: Dict[str, Any], use_thinking: bool = False) -> str:
        """Create prompt with data retrieval context"""
        chunks = context.get('chunks', [])
        
        if not chunks:
            return self.create_standard_prompt(question, use_thinking)
        
        # Build context from retrieved chunks (dynamically fit as many as possible)
        context_text = "RELEVANT CONTEXT:\n"
        max_chars_per_chunk = 1200  # Increased from 800 to 1200 characters per chunk
        max_total_context_chars = 30000  # Increased from 12000 to 25000 characters (80% of context window)
        
        total_chars_used = 0
        chunks_used = 0
        
        for i, chunk in enumerate(chunks, 1):
            content = chunk.get('content', '')
            score = chunk.get('score', 0)
            
            # Truncate content if too long
            if len(content) > max_chars_per_chunk:
                content = content[:max_chars_per_chunk] + "..."
            
            # Calculate how many characters this chunk would add
            chunk_text = f"{i}. [Score: {score:.3f}] {content}\n\n"
            chunk_chars = len(chunk_text)
            
            # Check if adding this chunk would exceed the limit
            if total_chars_used + chunk_chars > max_total_context_chars:
                print(f"   📊 Stopped at {chunks_used} chunks due to character limit")
                break
            
            context_text += chunk_text
            total_chars_used += chunk_chars
            chunks_used += 1
        
        print(f"   📊 Used {chunks_used} chunks ({total_chars_used} characters)")
        
        thinking_instruction = ""
        if use_thinking:
            thinking_instruction = """
<think>
[Your step-by-step reasoning here]
</think>

"""
        # Disabled for now - always use empty thinking instruction
        thinking_instruction = ""
        
        return f"""You are an expert qualitative analyst whose sole mandate is to exhaustively mine the provided text chunks and deliver a response that is unambiguously comprehensive, empowering, and direct.

INSTRUCTIONS – READ IN ORDER, NO OMISSIONS

1. Pre-Processing Commitment
   - Silently ingest and fully parse every one of the chunks before producing even a single sentence of output.
   - Keep an internal running tally of every discrete concept, example, contradiction, metaphor, statistic, stakeholder voice, and context-bound condition you encounter.

2. Thematic Cartography
   - Identify, label, and inter-relate ALL recurring and anomalous patterns across the chunks.  
     → Use short, memorable code names (e.g., "Trust-Deficit," "Resource-Scarcity Loop," "Shadow-Incentive").  
   - Map how these patterns amplify, attenuate, collide with, or transform one another.  
   - Explicitly flag which patterns are dominant, latent, or context-contingent.

3. Evidence Harvesting Rules (must appear verbatim in final answer)
   - Quote at least one representative passage from a minimum of 10 different chunks; include chunk ID in brackets [n].  
   - For each quote, annotate WHY it matters to the research question (one sentence max).  
   - Provide at least two counter-examples or limiting conditions drawn from separate chunks.

4. Conceptual Framework Construction
   - Create a concise, reusable framework (≤120 words) that captures the causal or configurational logic you discovered.  
   - Name the framework and present it in bold.  
   - Illustrate the framework with one micro-case drawn from the chunks.

5. Response Architecture (use these exact headings)
   A. Direct Answer – Begin with a single, declarative paragraph that answers the question without hedging.  
   B. Comprehensive Pattern Atlas – A table with three columns: Pattern Name | Core Evidence (quote + chunk ID) | Interaction Notes.  
   C. Framework & Micro-Case – Bolded framework followed by a 3-sentence vignette.  
   D. Counter-Evidence & Boundary Conditions – Bullet list of 2–3 items.  
   E. Actionable Implications – Numbered list of 3–5 concrete steps a practitioner could implement tomorrow, each tied back to a specific pattern.

6. Tone & Style
   - Zero fluff.  
   - Use signal verbs: "demonstrates," "undercuts," "reinforces," "renders ambiguous," etc.  
   - Where numeric data appear in the chunks, translate them into qualitative meaning rather than re-stating the number.

7. Final Compliance Check
   - Before output, verify:  
     □ At least 10 chunks explicitly cited  
     □ Framework present and bolded  
     □ Direct answer given in first paragraph  
     □ Counter-evidence included  
     □ Implications actionable and specific

# Thinking process disabled for now

IMPORTANT: Do not use thinking mode, step-by-step reasoning, or meta-commentary. Provide a direct answer immediately.

Relevant Materials:
{context_text}

Question:
{question}"""
    
    def _create_simple_data_retrieval_prompt(self, question: str, context: Dict[str, Any], use_thinking: bool = False) -> str:
        """Create a simplified prompt with data retrieval context for baseline comparison"""
        chunks = context.get('chunks', [])
        
        if not chunks:
            return self.create_standard_prompt(question, use_thinking)
        
        # Build simple context from retrieved chunks
        context_text = "Context:\n"
        max_chars_per_chunk = 1200  # Increased from 800 to 1200 characters per chunk
        max_total_context_chars = 50000  # Increased from 12000 to 25000 characters (80% of context window)
        
        total_chars_used = 0
        chunks_used = 0
        
        for i, chunk in enumerate(chunks, 1):
            content = chunk.get('content', '')
            score = chunk.get('score', 0)
            
            # Truncate content if too long
            if len(content) > max_chars_per_chunk:
                content = content[:max_chars_per_chunk] + "..."
            
            # Calculate how many characters this chunk would add
            chunk_text = f"{i}. [Score: {score:.3f}] {content}\n\n"
            chunk_chars = len(chunk_text)
            
            # Check if adding this chunk would exceed the limit
            if total_chars_used + chunk_chars > max_total_context_chars:
                print(f"   📊 Stopped at {chunks_used} chunks due to character limit")
                break
            
            context_text += chunk_text
            total_chars_used += chunk_chars
            chunks_used += 1
        
        print(f"   📊 Used {chunks_used} chunks ({total_chars_used} characters)")
        
        # Simple prompt without complex instructions and NO thinking
        return f"""You are an expert qualitative analyst.  
Your single mandate is to exhaustively mine the provided text chunks and deliver a response that is unambiguously comprehensive, empowering, and direct.

Use this format:
A. Direct Answer – Begin with a single, declarative paragraph that answers the question without hedging.
B. Comprehensive Pattern Atlas – A table with three columns: Pattern Name | Core Evidence (quote + chunk ID) | Interaction Notes.
C. Framework & Micro-Case
D. Counter-Evidence & Boundary Conditions
E. Actionable Implication

Rules
- Quote different chunks; include chunk ID in brackets [n].  
- No thinking process, meta-commentary, or step-by-step reasoning.

Relevant Materials:
{context_text}

Question:
{question}

Answer:"""
    
    def _create_topological_graph_prompt(self, question: str, context: Dict[str, Any], use_thinking: bool = False) -> str:
        """Create prompt with topological graph context"""
        hierarchy = context.get('hierarchy', {})
        graph_summary = context.get('graph_summary', '')
        
        if not hierarchy and not graph_summary:
            return self.create_standard_prompt(question, use_thinking)
        
        # Build context from graph structure
        context_text = "KNOWLEDGE GRAPH CONTEXT:\n"
        
        if graph_summary:
            context_text += f"{graph_summary}\n\n"
        
        thinking_instruction = ""
        if use_thinking:
            thinking_instruction = """
<think>
[Your step-by-step reasoning here]
</think>

"""
        # Disabled for now - always use empty thinking instruction
        thinking_instruction = ""
        
        return f"""{context_text}
Question: {question}{thinking_instruction}

Answer:"""
    
    def _create_hybrid_prompt(self, question: str, context: Dict[str, Any], use_thinking: bool = False) -> str:
        """Create prompt with hybrid context"""
        retriever_results = context.get('retriever_results', [])
        
        if not retriever_results:
            return self.create_standard_prompt(question, use_thinking)
        
        # Combine context from multiple retrievers
        context_text = "COMBINED CONTEXT:\n"
        
        for result in retriever_results:
            method = result.get('method', 'unknown')
            weight = result.get('weight', 1.0)
            
            if method == 'data_retrieval':
                chunks = result.get('chunks', [])
                if chunks:
                    context_text += f"DATA RETRIEVAL (Weight: {weight:.2f}):\n"
                    for i, chunk in enumerate(chunks[:3], 1):  # Limit to top 3 chunks
                        content = chunk.get('content', '')[:200]  # Truncate content
                        score = chunk.get('score', 0)
                        context_text += f"  {i}. [Score: {score:.3f}] {content}...\n"
                    context_text += "\n"
            
            elif method == 'topological_graph':
                hierarchical_context = result.get('hierarchical_context', {})
                if hierarchical_context:
                    context_text += f"TOPOLOGICAL GRAPH (Weight: {weight:.2f}):\n"
                    for level, summary in list(hierarchical_context.items())[:3]:  # Limit to top 3 levels
                        context_text += f"  Level {level}: {summary[:200]}...\n"
                    context_text += "\n"
        
        thinking_instruction = ""
        if use_thinking:
            thinking_instruction = """
<think>
[Your step-by-step reasoning here]
</think>

"""
        # Disabled for now - always use empty thinking instruction
        thinking_instruction = ""
        
        return f"""{context_text}
Question: {question}{thinking_instruction}

Answer:"""

    # def create_enhanced_prompt(self, question: str, hierarchy: Dict[int, List[str]], 
    #                              use_thinking: bool = False) -> str:
    #     """Create enhanced prompt with topological graph integration"""
        
    #     # Create hierarchical structure text with better organization
    #     hierarchy_text = "HIERARCHICAL CONCEPT STRUCTURE:\n\n"
        
    #     for level in sorted(hierarchy.keys()):
    #         nodes = hierarchy[level]
    #         hierarchy_text += f"Level {level} (Base Concepts):\n"
    #         for node in nodes:
    #             hierarchy_text += f"  • {node}\n"
    #         hierarchy_text += "\n"
        
    #     # Add instructions for using the knowledge structure
    #     instructions = """
    # INSTRUCTIONS:
    # 1. Use the hierarchical concept structure to understand the key themes and relationships
    # 2. Leverage the base concepts (Level 0) to identify fundamental principles
    # 3. Consider how higher-level concepts build upon and organize the base concepts
    # 4. Provide specific examples and references from the concept structure
    # 5. Structure your response to reflect the hierarchical organization of knowledge
    # 6. Make your answer comprehensive and convincing by incorporating relevant concepts

    # Please provide a detailed answer that:
    # 1. Addresses the core aspects of the question using the conceptual framework
    # 2. Shows understanding of how concepts relate to each other hierarchically
    # 3. Provides practical insights grounded in the structured knowledge
    # 4. Uses clear, organized structure that reflects the conceptual relationships
    # 5. References relevant concepts from the hierarchy where appropriate
    # 6. Includes specific examples and evidence to support your points"""
        
    #     if use_thinking:
    #         thinking_instruction = """
    # <think>
    # [Your step-by-step reasoning here, analyzing the hierarchical structure and how it relates to the question]
    # </think>

    # """
    #         return f"""Question: {question}

    # {hierarchy_text}

    # {instructions}

    # Answer:{thinking_instruction}"""
    #     else:
    #         # Add </think></think> to block thinking mode
    #         return f"""Question: {question}

    # {hierarchy_text}

    # {instructions}

    # </think></think>

    # Answer:"""

    # def create_enhanced_prompt(self, question: str, hierarchy: Dict[int, List[str]], 
    #                       use_thinking: bool = False, hierarchical_context: Dict[int, str] = None) -> str:
    #     """Create enhanced prompt with hierarchical structure integration and context"""
        
    #     # Create hierarchical structure text with better organization
    #     hierarchy_text = "HIERARCHICAL CONCEPT STRUCTURE WITH CONTEXT:\n\n"
        
    #     max_level = max(hierarchy.keys()) if hierarchy else 0
        
    #     for level in sorted(hierarchy.keys()):
    #         nodes = hierarchy[level]
    #         context = hierarchical_context.get(level, "") if hierarchical_context else ""
            
    #         # Describe the level based on its position in hierarchy
    #         if level == 0:
    #             level_description = "Level 0 (Foundation Concepts - Most Specific):"
    #         elif level == max_level:
    #             level_description = f"Level {level} (Abstract Concepts - Most General):"
    #         else:
    #             level_description = f"Level {level} (Intermediate Concepts):"
                
    #         hierarchy_text += f"{level_description}\n"
    #         for node in nodes:
    #             hierarchy_text += f"  • {node}\n"
            
    #         if context:
    #             hierarchy_text += f"\nContext for Level {level}:\n{context}\n"
            
    #         hierarchy_text += "\n"
        
    #     # Create conceptual flow explanation
    #     conceptual_flow = "CONCEPTUAL ORGANIZATION:\n\n"
    #     conceptual_flow += "📍 FOUNDATION → INTERMEDIATE → ABSTRACT FLOW:\n"
    #     conceptual_flow += "• Foundation concepts (Level 0) are the building blocks - specific, concrete ideas\n"
    #     conceptual_flow += "• Intermediate concepts combine and organize foundation concepts\n"
    #     conceptual_flow += "• Abstract concepts (highest level) represent broad themes and generalizations\n\n"
        
    #     # Show level relationships
    #     conceptual_flow += "🔄 LEVEL RELATIONSHIPS:\n"
    #     if hierarchy:
    #         for level in sorted(hierarchy.keys()):
    #             if level == 0:
    #                 conceptual_flow += f"• Level {level} concepts are foundational - they support higher levels\n"
    #             elif level == max_level:
    #                 conceptual_flow += f"• Level {level} concepts are most abstract - they encompass lower levels\n"
    #             else:
    #                 conceptual_flow += f"• Level {level} concepts bridge foundation and abstract concepts\n"
    #         conceptual_flow += "\n"
        
    #     # Enhanced instructions that work with hierarchy only
    #     instructions = """INSTRUCTIONS FOR USING THE KNOWLEDGE STRUCTURE:
    # 1. UNDERSTAND ABSTRACTION LEVELS: Higher numbered levels are more abstract/general
    # 2. BUILD FROM FOUNDATION: Level 0 concepts are your building blocks - start here for specifics  
    # 3. ORGANIZE BY HIERARCHY: Use intermediate levels to group and organize related concepts
    # 4. SYNTHESIZE AT TOP: Highest level concepts represent overarching themes and patterns
    # 5. TRACE CONCEPTUAL FLOW: Show how specific concepts (low levels) support general ones (high levels)
    # 6. LEVERAGE LEVEL STRUCTURE: Reference concepts from appropriate abstraction levels

    # KEY HIERARCHICAL INTERPRETATION:
    # - Level 0: Foundation concepts - specific, concrete, unmergeable building blocks
    # - Middle Levels: Organizing concepts - group and structure foundation concepts  
    # - Highest Level: Abstract themes - broad generalizations that encompass everything below
    # - Vertical Flow: Specific concepts support and build into more general concepts

    # Please provide a detailed answer that:
    # 1. Uses the hierarchical structure to organize your response from specific to general
    # 2. References foundation concepts (Level 0) for concrete examples and evidence
    # 3. Uses intermediate levels to show how concepts group and relate
    # 4. Connects to abstract themes (highest level) for broader insights
    # 5. Demonstrates understanding of how specificity builds into abstraction
    # 6. Structures your response to mirror the conceptual hierarchy"""

    #     if use_thinking:
    #         thinking_instruction = """
    # <think>
    # [Analyze the hierarchical structure. Consider:
    # - What foundation concepts (Level 0) provide the building blocks?
    # - How do intermediate levels organize and group these concepts? 
    # - What abstract themes (highest level) emerge from the structure?
    # - How does the hierarchy inform the answer to this specific question?
    # - What conceptual flow from specific to general best addresses the question?]
    # </think>

    # """
    #         return f"""Question: {question}

    # {hierarchy_text}
    # {conceptual_flow}
    # {instructions}

    # Answer:{thinking_instruction}"""
    #     else:
    #         return f"""Question: {question}

    # {hierarchy_text}
    # {conceptual_flow}
    # {instructions}

    # Answer:"""

    def create_enhanced_prompt_concise(self, question: str, hierarchy: Dict[int, List[str]], 
                                     hierarchical_context: Dict[str, Any] = None) -> str:
        """Create enhanced prompt with concise graph-level summary only"""
        
        # Extract concise graph summary if available
        if hierarchical_context and "graph_summary" in hierarchical_context:
            graph_summary = hierarchical_context["graph_summary"]
        else:
            # Create a basic concise summary if not available
            graph_summary = self._create_basic_graph_summary(hierarchy)
        
        # Create concise prompt
        knowledge_structure = "KNOWLEDGE GRAPH SUMMARY:\n\n"
        knowledge_structure += graph_summary
        
        instructions = """GUIDANCE:
Use this knowledge graph summary to provide a comprehensive answer. The summary captures the key concepts and their relationships in a concise format."""
        
        return f"""Question: {question}

{knowledge_structure}

{instructions}

Answer:"""
    
    def _create_basic_graph_summary(self, hierarchy: Dict[int, List[str]]) -> str:
        """Create a basic graph summary when hierarchical context is not available"""
        total_codes = sum(len(codes) for codes in hierarchy.values())
        total_levels = len(hierarchy)
        
        summary_parts = []
        for level in sorted(hierarchy.keys()):
            codes = hierarchy[level]
            if level == 0:
                level_desc = f"Foundation concepts ({len(codes)} codes)"
            elif level == max(hierarchy.keys()):
                level_desc = f"Abstract themes ({len(codes)} codes)"
            else:
                level_desc = f"Intermediate concepts ({len(codes)} codes)"
            
            # Show first few codes as examples
            examples = ", ".join(codes[:3])
            summary_parts.append(f"{level_desc}: {examples}")
        
        return f"Knowledge graph with {total_codes} concepts across {total_levels} levels:\n" + "\n".join(summary_parts)
    
    def create_enhanced_prompt(self, question: str, hierarchy: Dict[int, List[str]], 
                          use_thinking: bool = False, hierarchical_context: Dict[int, str] = None,
                          context_data: Dict[str, Any] = None) -> str:
        """Create enhanced prompt with streamlined hierarchical integration"""
        
        # Use rich context data if available (from enhanced summarizer)
        if context_data and "level_summaries" in context_data:
            return self._create_prompt_with_rich_context(question, context_data, use_thinking)
        
        # Fallback to basic hierarchical context
        return self._create_prompt_with_basic_context(question, hierarchy, hierarchical_context, use_thinking)

    def _create_prompt_with_rich_context(self, question: str, context_data: Dict[str, Any], 
                                        use_thinking: bool = False) -> str:
        """Create prompt using rich context data from enhanced summarizer"""

        level_summaries = context_data["level_summaries"]
        hierarchy = context_data["hierarchy"]
        graph_stats = context_data.get("graph_stats", {})
        
        # Build knowledge structure with integrated evidence
        knowledge_text = "KNOWLEDGE STRUCTURE:\n\n"
        
        max_level = max(hierarchy.keys()) if hierarchy else 0
        total_evidence = sum(level_data.get("evidence_count", 0) for level_data in level_summaries.values())

        for level in sorted(hierarchy.keys()):
            level_data = level_summaries.get(level, {})
            evidence_count = level_data.get("evidence_count", 0)
            
            # Level header with context
            if level == 0:
                knowledge_text += f"🔹 **Foundation Concepts** (Level {level}) - {evidence_count} evidence points:\n"
            elif level == max_level:
                knowledge_text += f"🎯 **Core Themes** (Level {level}) - {evidence_count} evidence points:\n"
            else:
                knowledge_text += f"🔗 **Organizing Concepts** (Level {level}) - {evidence_count} evidence points:\n"
            
            # Add concepts and their context
            if "summary" in level_data and level_data["summary"]:
                knowledge_text += f"{level_data['summary']}\n"
            else:
                # Fallback to basic concept listing
                for node in hierarchy.get(level, []):
                    knowledge_text += f"  • {node}\n"
            
            # Add relationship context if available
            if level_data.get("parent_relationships") and int(level) > 0:
                knowledge_text += f"*Connected to broader themes: {', '.join(level_data['parent_relationships'][:3])}*\n"
            if level_data.get("child_relationships") and int(level) < int(max_level):
                knowledge_text += f"*Includes specific aspects: {', '.join(level_data['child_relationships'][:3])}*\n"
            
            knowledge_text += "\n"
        
        # Add structure insight
        structure_insight = f"📊 **Structure Overview**: {total_evidence} total evidence points across {len(hierarchy)} conceptual levels"
        if graph_stats.get("edges", 0) > 0:
            structure_insight += f", {graph_stats['edges']} topical relationships"
        structure_insight += "\n\n"
        
        # Enhanced, specific instructions
        instructions = """**RESPONSE REQUIREMENTS:**

1. **CONCRETE EXAMPLES FIRST**: Start with specific, tangible examples from the foundation concepts. Name actual techniques, methods, or specific instances mentioned in the knowledge structure.

2. **SHOW THE MECHANISM**: Don't just list concepts - explain HOW they work together. Use phrases like "This works by..." or "The process involves..." to show the actual mechanisms.

3. **BALANCE SPECIFICITY AND INSIGHT**: 
   - Use foundation concepts for concrete details and specific techniques
   - Use organizing concepts to show how techniques connect and build upon each other
   - Use core themes to provide broader insights and principles

4. **DATAPOINT-BACKED EVIDENCE**: When making claims, reference specific evidence from the original datapoints/chunks. Use phrases like "As shown in the original content..." or "The video demonstrates..." or "In the actual footage..." to reference concrete evidence from the source material.

5. **PRACTICAL APPLICATION**: Explain not just what is done, but WHY it works and HOW it could be applied. Make the insights actionable.

6. **SYNTHESIS ACROSS LEVELS**: Show how specific techniques (foundation) create broader patterns (organizing) that reveal fundamental principles (core themes).

**RESPONSE STRUCTURE:**
- Begin with 2-3 specific, concrete examples from the foundation concepts
- Explain the mechanisms and processes that make these examples effective
- Show how these specific techniques connect to broader organizing principles
- Conclude with actionable insights that synthesize across all levels

**EVIDENCE INTEGRATION:**
- Reference specific moments, techniques, or content from the original datapoints
- Use concrete examples from the actual video content or text chunks
- Connect abstract concepts to tangible evidence from the source material
- When referencing evidence, mention specific details like "In the video content..." or "The original text shows..." or "As demonstrated in the footage..."
- Use the evidence count and source information to strengthen your claims (e.g., "This is supported by X evidence points from the original content")

Provide a comprehensive, evidence-backed response that demonstrates deep understanding of both the specific techniques and their broader implications."""
        
        if use_thinking:
            thinking_prompt = """
<think>
Let me analyze this step by step:
1. What specific examples and techniques are mentioned in the foundation concepts?
2. What concrete evidence from the original datapoints supports these concepts?
3. How do these specific techniques work together to create broader patterns?
4. What mechanisms and processes make these techniques effective?
5. How do the organizing concepts show the relationships between techniques?
6. What fundamental principles emerge from the core themes?
7. How can I connect abstract concepts to tangible evidence from the source material?
8. How can I synthesize this into actionable insights?
</think>

"""
            return f"""Question: {question}

{structure_insight}{knowledge_text}{instructions}

Answer:{thinking_prompt}"""
        else:
            return f"""Question: {question}

{structure_insight}{knowledge_text}{instructions}

Answer:"""

    def _create_prompt_with_basic_context(self, question: str, hierarchy: Dict[int, List[str]], 
                                        hierarchical_context: Dict[int, str] = None,
                                        use_thinking: bool = False) -> str:
        """Create prompt with basic hierarchical context (fallback method)"""
        
        knowledge_text = "KNOWLEDGE STRUCTURE:\n\n"
        max_level = max(hierarchy.keys()) if hierarchy else 0
        
        for level in sorted(hierarchy.keys()):
            nodes = hierarchy[level]
            context = hierarchical_context.get(level, "") if hierarchical_context else ""
            
            # Simplified level descriptions
            if level == 0:
                knowledge_text += f"🔹 **Foundation Concepts** (Level {level}):\n"
            elif level == max_level:
                knowledge_text += f"🎯 **Core Themes** (Level {level}):\n"
            else:
                knowledge_text += f"🔗 **Organizing Concepts** (Level {level}):\n"
            
            # List concepts
            for node in nodes:
                knowledge_text += f"  • {node}\n"
            
            # Add context if available
            if context and context.strip():
                # Clean up context presentation
                context_lines = [line.strip() for line in context.split('\n') if line.strip()]
                if context_lines:
                    knowledge_text += f"\nSupporting details:\n"
                    for line in context_lines[:3]:  # Limit to prevent overwhelming
                        knowledge_text += f"  {line}\n"
            
            knowledge_text += "\n"
        
        # Simplified conceptual guidance
        conceptual_guidance = """**Conceptual Flow**: Foundation concepts → Organizing concepts → Core themes
    *Foundation concepts provide specific details, organizing concepts show relationships, core themes reveal broader insights*

    """
        
        # Streamlined instructions
        instructions = """**Analysis Approach:**
    Use the knowledge structure to build a comprehensive response. Start with specific foundation concepts for concrete details, show how organizing concepts group related ideas, and connect to core themes for broader insights.

    """
        
        if use_thinking:
            thinking_prompt = """
    <think>
    What foundation concepts are most relevant? How do they organize into broader themes? What insights does this structure reveal about the question?
    </think>

    """
            return f"""Question: {question}

    {knowledge_text}{conceptual_guidance}{instructions}

    Answer:{thinking_prompt}"""
        else:
            return f"""Question: {question}

    {knowledge_text}{conceptual_guidance}{instructions}

    Answer:"""

    # Alternative: Even more minimal approach
    def create_minimal_enhanced_prompt(self, question: str, hierarchy: Dict[int, List[str]], 
                                    hierarchical_context: Dict[int, str] = None,
                                    context_data: Dict[str, Any] = None) -> str:
        """Create minimal prompt that lets the knowledge structure speak for itself"""
        
        if context_data and "level_summaries" in context_data:
            level_summaries = context_data["level_summaries"]
            
            knowledge_text = "**Available Knowledge:**\n\n"
            
            for level in sorted(level_summaries.keys()):
                level_data = level_summaries[level]
                if "summary" in level_data and level_data["summary"]:
                    knowledge_text += f"{level_data['summary']}\n\n"
            
            return f"""Question: {question}

    {knowledge_text}Using the knowledge above, provide a comprehensive and well-supported answer.

    Answer:"""
        
        else:
            # Fallback for basic context
            knowledge_text = "**Available Knowledge:**\n\n"
            
            for level in sorted(hierarchy.keys()):
                nodes = hierarchy[level]
                context = hierarchical_context.get(level, "") if hierarchical_context else ""
                
                for node in nodes:
                    knowledge_text += f"• {node}\n"
                
                if context:
                    context_preview = context.split('\n')[0][:150] + "..." if len(context) > 150 else context
                    knowledge_text += f"  Supporting details: {context_preview}\n"
                
                knowledge_text += "\n"
            
            return f"""Question: {question}

    {knowledge_text}Provide a comprehensive answer using the knowledge above.

    Answer:"""

    # Context-aware prompt selector
    def create_adaptive_prompt(self, question: str, hierarchy: Dict[int, List[str]], 
                            hierarchical_context: Dict[int, str] = None,
                            context_data: Dict[str, Any] = None,
                            prompt_style: str = "enhanced") -> str:
        """Create prompt with adaptive style based on available data and preference"""
        
        if prompt_style == "minimal":
            return self.create_minimal_enhanced_prompt(question, hierarchy, hierarchical_context, context_data)
        elif prompt_style == "rich" and context_data:
            return self._create_prompt_with_rich_context(question, context_data, use_thinking=False)
        else:
            return self.create_enhanced_prompt(question, hierarchy, use_thinking=False, 
                                         hierarchical_context=hierarchical_context, 
                                         context_data=context_data)
    
    async def call_llm_model(self, prompt: str, use_thinking: bool = False) -> str:
        """Call the LLM model with the given prompt"""
        try:
            if use_thinking:
                # Add thinking mode prefix
                thinking_prompt = f"<think>\nLet me think through this step by step:\n\n{prompt}\n\n</think>"
                response = await self._make_request(thinking_prompt)
            else:
                response = await self._make_request(prompt)
            
            return response
        except Exception as e:
            print(f"❌ Error calling LLM model: {e}")
            return "❌ Failed to generate response"

    async def call_llm_model_with_quality_check(self, prompt: str, use_thinking: bool = False, max_retries: int = 3) -> str:
        """Call the LLM model with quality validation and retry logic"""
        for attempt in range(max_retries):
            try:
                response = await self.call_llm_model(prompt, use_thinking)
                
                # Check response quality
                quality_score = self._evaluate_response_quality(response)
                
                if quality_score >= 0.8:  # Increased threshold for higher quality
                    print(f"   ✅ High-quality response achieved (score: {quality_score:.2f})")
                    return response
                else:
                    print(f"   ⚠️  Low-quality response (score: {quality_score:.2f}), retrying... (attempt {attempt + 1}/{max_retries})")
                    
            except Exception as e:
                print(f"   ❌ Error on attempt {attempt + 1}: {e}")
                if attempt == max_retries - 1:
                    raise e
        
        # If all retries failed, return the last response
        print(f"   ⚠️  Using best available response after {max_retries} attempts")
        return response

    def _evaluate_response_quality(self, response: str) -> float:
        """Evaluate the quality of a response based on key criteria"""
        score = 0.0
        total_criteria = 5  # Increased from 4 to 5 criteria
        
        # Check for citations (CHUNK references) - More stringent
        citations = response.count("CHUNK")
        if citations >= 5:
            score += 1.0
        elif citations >= 3:
            score += 0.7
        elif citations >= 1:
            score += 0.3
        
        # Check for cross-linking between points - More comprehensive
        cross_link_words = ["complement", "reinforce", "together", "while", "simultaneously", "harmony", "unified", "work together", "enhanced by", "seamless blend", "cohesive"]
        has_cross_links = any(word in response.lower() for word in cross_link_words)
        if has_cross_links:
            score += 1.0
        
        # Check for synthesis/insight - More comprehensive
        synthesis_words = ["unified", "pattern", "cohesive", "strategy", "ultimately", "overall", "reveals", "masterfully", "transforming", "immersive", "dynamic"]
        has_synthesis = any(word in response.lower() for word in synthesis_words)
        if has_synthesis:
            score += 1.0
        
        # Check for reasoning (not just evidence) - More comprehensive
        reasoning_words = ["because", "since", "as", "therefore", "thus", "reason", "why", "allows", "enables", "creates", "ensures", "makes"]
        has_reasoning = any(word in response.lower() for word in reasoning_words)
        if has_reasoning:
            score += 1.0
        
        # NEW: Check for strong thesis and structure
        thesis_indicators = ["masterfully", "transforming", "immersive", "compelling", "dynamic", "cohesive"]
        has_strong_thesis = any(word in response.lower() for word in thesis_indicators)
        has_clear_structure = response.count("First,") + response.count("Second,") + response.count("Third,") + response.count("What's more,") >= 2
        if has_strong_thesis and has_clear_structure:
            score += 1.0
        elif has_strong_thesis or has_clear_structure:
            score += 0.5
        
        return score / total_criteria

    async def _make_request(self, prompt: str) -> str:
        """Make the actual HTTP request to the LLM"""
        system_message = """You are a helpful assistant with access to hierarchical knowledge structures. 
Use the provided concept hierarchy to give comprehensive, well-structured answers with specific examples.

Focus on:
- Using specific concepts from the hierarchy
- Providing concrete examples and evidence
- Making connections between different levels of concepts
- Creating convincing, detailed responses

IMPORTANT: If the prompt contains <think> tags, you MUST use them to show your reasoning process before providing your answer."""
        
        payload = {
            "model": self.model_config['model_name'],
            "messages": [
                {"role": "system", "content": system_message},
                {"role": "user", "content": prompt}
            ],
            "temperature": self.model_config['temperature'],
            "max_tokens": self.model_config['max_tokens'],
            "stop": ["Human:", "Assistant:"]
        }
        
        async with self.session.post(
            f"{self.model_config['base_url']}/v1/chat/completions",
            json=payload,
            timeout=120
        ) as response:
            if response.status == 200:
                result = await response.json()
                return result['choices'][0]['message']['content']
            else:
                print(f"❌ Error {response.status}: {await response.text()}")
                return None
    
    async def answer_question_standard(self, question: str, use_thinking: bool = False) -> str:
        """Answer question using standard approach (no graph)"""
        print("🤔 Answering question (standard mode)...")
        
        prompt = self.create_standard_prompt(question, use_thinking)
        response = await self.call_llm_model_with_quality_check(prompt, use_thinking)
        
        if response and "❌ Failed" not in response:
            return response
        else:
            return "❌ Failed to generate answer"
    
    async def answer_question_enhanced(self, question: str, use_thinking: bool = False, strategy: str = "dynamic", simple_prompt: bool = False) -> str:
        """Answer question using enhanced approach with context retrieval"""
        print(f"🚀 Running ENHANCED question answering...")
        
        try:
            # Retrieve context using the configured retriever
            context = await self.context_retriever.retrieve_context(question, strategy=strategy)
            
            # Log context summary
            context_summary = self.context_retriever.get_context_summary(context)
            print(f"📊 Context: {context_summary}")
            
            # Check if context retrieval failed
            if 'error' in context:
                print(f"⚠️ Context retrieval failed: {context['error']}")
                print("⚠️ Falling back to standard mode")
                return await self.answer_question_standard(question, use_thinking)
            
            # Create prompt with retrieved context
            prompt = self.create_context_prompt(question, context, use_thinking, simple_prompt)
            response = await self.call_llm_model_with_quality_check(prompt, use_thinking)
            
            if response and "❌ Failed" not in response:
                return response
            else:
                return "❌ Failed to generate enhanced answer"
                
        except Exception as e:
            print(f"❌ Enhanced question answering failed: {e}")
            print("⚠️ Falling back to standard mode")
            return await self.answer_question_standard(question, use_thinking)
    
    async def answer_question_with_chunks(self, question: str, chunks: List[Dict[str, Any]], 
                                         strategy: str = "dynamic", max_chars: int = 25000, 
                                         chunk_limit: int = 1200, top_k: int = 10, 
                                         simple_prompt: bool = False) -> Dict[str, Any]:
        """
        Answer a question using chunks with configurable strategy
        
        Args:
            question: The question to answer
            chunks: List of chunk dictionaries with 'content'/'chunk_id' and 'score' keys
            strategy: "fixed" or "dynamic"
            max_chars: Maximum characters for context (dynamic strategy)
            chunk_limit: Maximum characters per chunk (truncation)
            top_k: Number of chunks to use (fixed strategy)
            
        Returns:
            Dictionary with answer, metadata, and performance info
        """
        start_time = time.time()
        
        if strategy == "fixed":
            context, chunks_used = self._create_fixed_context(chunks, top_k, chunk_limit)
        elif strategy == "dynamic":
            context, chunks_used = self._create_dynamic_context(chunks, max_chars, chunk_limit)
        else:
            raise ValueError(f"Unknown strategy: {strategy}. Use 'fixed' or 'dynamic'")
        
        # Generate answer using our custom analytical prompt
        context_dict = {
            'method': 'data_retrieval',
            'chunks': chunks
        }
        
        prompt = self.create_context_prompt(question, context_dict, use_thinking=False, simple_prompt=simple_prompt)
        answer = await self.call_llm_model(prompt, use_thinking=False)  # Disabled for now
        
        end_time = time.time()
        
        return {
            'answer': answer,
            'strategy': strategy,
            'chunks_used': chunks_used,
            'context_length': len(context),
            'prompt_length': len(prompt),
            'answer_length': len(answer),
            'response_time': end_time - start_time,
            'chunk_limit': chunk_limit,
            'max_chars': max_chars if strategy == "dynamic" else None,
            'top_k': top_k if strategy == "fixed" else None
        }
    
    def _create_fixed_context(self, chunks: List[Dict[str, Any]], top_k: int, chunk_limit: int) -> tuple[str, int]:
        """Create context with fixed number of chunks"""
        selected_chunks = chunks[:top_k]
        context_parts = []
        
        for i, chunk in enumerate(selected_chunks, 1):
            content = chunk.get('content', chunk.get('chunk_id', str(chunk)))
            
            # Truncate if needed
            if len(content) > chunk_limit:
                content = content[:chunk_limit] + "..."
            
            context_parts.append(f"CHUNK {i} (Score: {chunk['score']:.3f}):\n{content}\n")
        
        return "\n".join(context_parts), len(selected_chunks)
    
    def _create_dynamic_context(self, chunks: List[Dict[str, Any]], max_chars: int, chunk_limit: int) -> tuple[str, int]:
        """Create context with dynamic fitting"""
        context_parts = []
        total_chars = 0
        chunks_used = 0
        
        for chunk in chunks:
            content = chunk.get('content', chunk.get('chunk_id', str(chunk)))
            
            # Truncate chunk to chunk_limit characters
            if len(content) > chunk_limit:
                content = content[:chunk_limit] + "..."
            
            chunk_length = len(content)
            
            if total_chars + chunk_length <= max_chars:
                chunks_used += 1
                context_parts.append(f"CHUNK {chunks_used} (Score: {chunk['score']:.3f}):\n{content}\n")
                total_chars += chunk_length
            else:
                break
        
        return "\n".join(context_parts), chunks_used

    def save_answer(self, question: str, answer: str, mode: str, output_path: str):
        """Save the question and answer to a file"""
        result = {
            'question': question,
            'answer': answer,
            'mode': mode,
            'timestamp': pd.Timestamp.now().isoformat()
        }
        
        # Save as JSON
        with open(output_path, 'w') as f:
            json.dump(result, f, indent=2)
        
        print(f"💾 Saved answer to: {output_path}")

async def answer_question(question: str, mode: str = "standard",
                        output_path: Optional[str] = None,
                        model_config: Dict[str, Any] = None,
                        context_retriever: BaseContextRetriever = None,
                        use_thinking: bool = False, strategy: str = "dynamic", simple_prompt: bool = False) -> str:
    """
    Answer a question using either standard or enhanced mode
    
    Args:
        question: The question to answer
        mode: "standard" or "enhanced" (enhanced uses context retrieval)
        output_path: Path to save the answer
        model_config: Model configuration dict
        context_retriever: Context retriever for enhanced mode
        use_thinking: Whether to enable thinking mode (shows step-by-step reasoning)
        simple_prompt: Whether to use simplified prompt for enhanced mode (for baseline comparison)
        
    Returns:
        The generated answer
    """
    async with QuestionAnswerer(model_config=model_config, context_retriever=context_retriever) as answerer:
        if mode == "enhanced":
            # Enhanced mode - uses context retrieval
            answer = await answerer.answer_question_enhanced(question, use_thinking, strategy, simple_prompt)
            mode = "enhanced"
        else:
            # Standard mode
            answer = await answerer.answer_question_standard(question, use_thinking)
            mode = "standard"
        
        # Save answer if output path provided
        if output_path:
            answerer.save_answer(question, answer, mode, output_path)
        
        return answer

if __name__ == "__main__":
    # Example usage
    import argparse
    
    parser = argparse.ArgumentParser(description="Question Answering with Topological Graph")
    parser.add_argument("--question", required=True, help="Question to answer")
    parser.add_argument("--graph-dir", help="Directory containing topological graph data")
    parser.add_argument("--output", help="Output file path")
    parser.add_argument("--mode", choices=["standard", "enhanced"], default="auto",
                       help="Answering mode (auto chooses based on graph availability)")
    
    args = parser.parse_args()
    
    async def main():
        if args.mode == "enhanced" and not args.graph_dir:
            print("❌ Enhanced mode requires --graph-dir")
            return
        
        answer = await answer_question(
            question=args.question,
            graph_dir=args.graph_dir if args.mode != "standard" else None,
            output_path=args.output
        )
        
        print("\n" + "="*50)
        print("ANSWER:")
        print("="*50)
        print(answer)
    
    asyncio.run(main()) 