from __future__ import annotations

# from dataclasses import dataclass, field
from typing import TypedDict, List

from langgraph.graph import add_messages
from typing_extensions import Annotated


# import operator
# from dataclasses import dataclass, field
from typing_extensions import Annotated

from agents.schemas import SearchResult, Reference

def update_searcher_state(left: SearcherState, right: SearcherState) -> SearcherState:

    existing_search_count = left.get("search_count", 0) if left else 0
    new_search_count = right.get("search_count", 0) if right else 0

    search_count = existing_search_count + new_search_count

    # Get existing lists or empty lists if None
    existing_keywords = left.get("used_keywords", []) if left else []
    existing_results = left.get("search_results", []) if left else []
    
    new_keywords = right.get("used_keywords", []) if right else []
    new_results = right.get("search_results", []) if right else []
    
    # Deduplicate keywords (preserves order)
    all_keywords = existing_keywords + new_keywords
    unique_keywords = list(dict.fromkeys(all_keywords))
    
    # Deduplicate search results by URL
    # Use a dict to handle duplicates
    result_dict = {}
    
    # First add existing results
    for result in existing_results:
        result_dict[result.url] = result

    for result in new_results:
        result_dict[result.url] = result

    
    
    # Then add new results
    # For search results, we typically want to keep the latest snippet
    # since search result snippets can vary based on query context

    # for result in new_results:
    #     if hasattr(result, 'url'):
    #         result_dict[result.url] = result
    #     else:
    #         print(f"Warning: Invalid new result type: {type(result)} - {result}")

    # Convert to list of SearchResult objects
    unique_results = list(result_dict.values())

    
    # Handle history_search_results
    existing_history_results = left.get("history_search_results", []) if left else []
    new_history_results = right.get("history_search_results", []) if right else []
    
    # Combine and deduplicate history results by URL
    history_dict = {}
    for result in existing_history_results:
        history_dict[result.url] = result
    for result in new_history_results:
        history_dict[result.url] = result
    
    unique_history_results = list(history_dict.values())
    
    # Handle search_cache
    existing_cache = left.get("search_cache", {}) if left else {}
    new_cache = right.get("search_cache", {}) if right else {}
    merged_cache = {**existing_cache, **new_cache}  # New cache entries override existing ones
    
    return SearcherState(
        search_count=search_count,
        used_keywords=unique_keywords,
        history_search_results=unique_history_results,
        search_results=unique_results,
        search_cache=merged_cache
    )

def update_browser_state(left: BrowserState, right: BrowserState) -> BrowserState:

    existing_visit_count = left.get("visit_count", 0) if left else 0
    new_visit_count = right.get("visit_count", 0) if right else 0

    visit_count = existing_visit_count + new_visit_count

    # Get existing lists or empty lists if None
    existing_urls = left.get("visited_urls", []) if left else []
    existing_refs = left.get("found_references", []) if left else []
    
    new_urls = right.get("visited_urls", []) if right else []
    new_refs = right.get("found_references", []) if right else []
    
    # Deduplicate URLs (preserves order)
    all_urls = existing_urls + new_urls
    unique_urls = list(dict.fromkeys(all_urls))
    
    # Deduplicate references by URL
    # Use a dict to merge references with the same URL
    ref_dict = {}
    
    # First add existing references
    for ref in existing_refs:
        ref_dict[ref.url] = ref
    
    # Then add new references (this will override if same URL exists)
    # Or merge information_list if you want to combine them
    for ref in new_refs:
        if ref.url in ref_dict:
            # Merge information lists and deduplicate
            existing_info = ref_dict[ref.url].information_list
            combined_info = existing_info + ref.information_list
            unique_info = list(dict.fromkeys(combined_info))  # Deduplicate info items
            
            # Create new Reference with merged information
            ref_dict[ref.url] = Reference(
                url=ref.url,
                information_list=unique_info
            )
        else:
            ref_dict[ref.url] = ref
    
    # Convert back to list (preserves insertion order in Python 3.7+)
    unique_refs = list(ref_dict.values())
    
    # Handle history_found_references
    existing_history_refs = left.get("history_found_references", []) if left else []
    new_history_refs = right.get("history_found_references", []) if right else []
    
    # Combine and deduplicate history references by URL with information merging
    history_ref_dict = {}
    for ref in existing_history_refs:
        history_ref_dict[ref.url] = ref
    
    for ref in new_history_refs:
        if ref.url in history_ref_dict:
            # Merge information lists and deduplicate
            existing_info = history_ref_dict[ref.url].information_list
            combined_info = existing_info + ref.information_list
            unique_info = list(dict.fromkeys(combined_info))  # Deduplicate info items
            
            # Create new Reference with merged information
            history_ref_dict[ref.url] = Reference(
                url=ref.url,
                information_list=unique_info
            )
        else:
            history_ref_dict[ref.url] = ref
    
    unique_history_refs = list(history_ref_dict.values())
    
    # Handle visit_cache
    existing_cache = left.get("visit_cache", {}) if left else {}
    new_cache = right.get("visit_cache", {}) if right else {}
    merged_cache = {**existing_cache, **new_cache}  # New cache entries override existing ones
    
    return BrowserState(
        visit_count=visit_count,
        visited_urls=unique_urls,
        history_found_references=unique_history_refs,
        found_references=unique_refs,
        visit_cache=merged_cache
    )

class OverallState(TypedDict):
    messages: Annotated[list, add_messages]
    current_sub_question: str
    current_sub_question_iteration: int
    current_summary: str
    final_answer: str
    sub_verified: bool
    final_verified: bool
    searcher_state: Annotated[SearcherState, update_searcher_state]  # Added reducer
    browser_state: Annotated[BrowserState, update_browser_state]  # Added reducer
    instruction_state: InstructionState

class SearcherState(TypedDict):
    search_count: int
    used_keywords: List[str]
    history_search_results: List[SearchResult]
    search_results: List[SearchResult]
    search_cache: dict

class BrowserState(TypedDict):
    visit_count: int
    visited_urls: List[str]
    history_found_references: List[Reference]
    found_references: List[Reference]
    visit_cache: dict

class InstructionState(TypedDict):
    orchestrator_instructions: List[str]
    searcher_instructions: List[str]
    browser_instructions: List[str]