import os
import json
import random
import logging
from dotenv import load_dotenv
from typing import List
import threading
from concurrent.futures import ThreadPoolExecutor, as_completed

from langchain_qwq import ChatQwen
from langchain_core.runnables import RunnableConfig

from agents.state import OverallState, SearcherState, BrowserState
from agents.prompts import *
from agents.schemas import *
from agents.qwq.config import Configuration
from agents.utils import get_user_question, get_search_results, visit, split_webpage_content

load_dotenv(dotenv_path=".env")

# Setup logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger(__name__)

DASHSCOPE_API_KEY = os.getenv("DASHSCOPE_API_KEY")
SERP_API_KEY = os.getenv("SERP_API_KEY")
JINA_API_KEY = os.getenv("JINA_API_KEY")

# maximum number of sub-questions generated at one time
MAX_Q = 5

def advanced_searcher(state: OverallState, config: RunnableConfig) -> OverallState:
    """
    This is an advanced searcher block that searches the web in multiple threads.
    """
    logger.info("Executing advanced searcher")
    configurable = Configuration.from_runnable_config(config)
    llm = ChatQwen(
        model=configurable.searcher_model,
        api_key=DASHSCOPE_API_KEY,
        # base_url="...",
        # organization="...",
        # other params...
    )

    if state.get('instruction_state', {}).get('searcher_instructions'):
        experiences = f"**Some experiences that might be userful:**\n{'\n'.join(state.get('instruction_state', {}).get('searcher_instructions', []))}"
    else:
        experiences = ""

    def _break_down_goal():
        while True:
            structured_llm = llm.with_structured_output(BreakDownGoal)
            formatted_prompt = break_down_goal_prompt.format(question=get_user_question(state['messages']),
                                                                sub_goal=state.get('current_sub_question', ''),
                                                                current_date=get_current_date())
            result = structured_llm.invoke(formatted_prompt)
            try:
                return result.list_of_goals
            except:
                continue

    def _search_one_query(query: str, search_cache: dict, cache_lock: threading.Lock):
        # Thread-safe cache check
        with cache_lock:
            if query in search_cache:
                search_results = search_cache[query]
                logger.info(f"Cache hit for query: {query}")
            else:
                search_results = None
        
        # If not in cache, perform search
        if search_results is None:
            logger.info(f"Searching API for query: {query}")
            api_key = SERP_API_KEY
            search_results = get_search_results(query=query, api_key=api_key)
            
            # Thread-safe cache update
            with cache_lock:
                search_cache[query] = search_results
        
        # Convert raw results to proper format for LLM processing
        if isinstance(search_results, str):
            # Handle error cases
            formatted_results = search_results
        else:
            formatted_results = json.dumps(search_results, indent=4)
            
        structured_llm = llm.with_structured_output(SelectedSearchResults)
        formatted_prompt = search_result_selection_prompt.format(query=query,
                                                                 original_question=get_user_question(state['messages']),
                                                                 sub_question=state.get('current_sub_question', ''),
                                                                #  current_summary=state['current_summary'],
                                                                 search_results=formatted_results,
                                                                 current_date=get_current_date(),
                                                                 experiences=experiences)
        result = structured_llm.invoke(formatted_prompt)
        try:
            return query, result.selected_results
        except:
            return query, []

    def _get_query_list(goal: str):
        logger.info(f"Generating queries for goal: {goal}")
        structured_llm = llm.with_structured_output(QueryWriter)
        formatted_prompt = query_writer_prompt.format(query_count=configurable.number_of_queries_per_search, 
                                                      current_date=get_current_date(),
                                                      original_question=get_user_question(state['messages']),
                                                      sub_question=state.get('current_sub_question', ''),
                                                      used_search_keywords_and_phrases=state.get('searcher_state', {}).get('used_keywords', []),
                                                      current_summary=state.get('current_summary', ''),
                                                      experiences=experiences)
        result = structured_llm.invoke(formatted_prompt)
        try:
            return result.search_query_list
        except:
            return []

    # Initialize shared resources
    search_cache = state.get('searcher_state', {}).get('search_cache', {})
    cache_lock = threading.Lock()
    search_count = 0
    used_keywords = []
    selected_search_results_list = []
    
    # Break down goals
    list_of_goals = _break_down_goal()
    logger.info(f"Processing {len(list_of_goals)} goals")
    
    # Collect all queries from all goals first
    all_queries = []
    for goal in list_of_goals:
        query_list = _get_query_list(goal)
        logger.info(f"Goal: '{goal}' generated {len(query_list)} queries")
        all_queries.extend(query_list)
        used_keywords.extend(query_list)
    
    search_count = len(all_queries)
    logger.info(f"Total queries to process: {search_count}")
    
    # Process all queries in parallel using ThreadPoolExecutor
    max_workers = min(10, len(all_queries))  # Limit concurrent requests to avoid API rate limits
    
    with ThreadPoolExecutor(max_workers=max_workers) as executor:
        # Submit all search tasks
        future_to_query = {
            executor.submit(_search_one_query, query, search_cache, cache_lock): query 
            for query in all_queries
        }
        
        # Collect results as they complete
        for future in as_completed(future_to_query):
            query = future_to_query[future]
            try:
                original_query, selected_results = future.result()
                selected_search_results_list.extend(selected_results)
                logger.info(f"Completed search for query: {original_query}")
            except Exception as exc:
                logger.error(f"Query '{query}' generated an exception: {exc}")
    
    logger.info(f"Completed all searches. Total results: {len(selected_search_results_list)}")
    
    searcher_state = SearcherState(
        search_count=search_count,
        used_keywords=used_keywords,
        search_cache=search_cache,
        search_results=selected_search_results_list
    )
    return {"searcher_state": searcher_state}

def advanced_browser(state: OverallState, config: RunnableConfig) -> OverallState:
    """
    This is an advanced browser block that visits web pages, extracts relevant information, and creates references from the collected content in multiple threads.
    """
    logger.info("🌐 Starting web browsing process...")
    configurable = Configuration.from_runnable_config(config)
    llm = ChatQwen(
        model=configurable.browser_model,
        api_key=DASHSCOPE_API_KEY,
    )

    if state.get('instruction_state', {}).get('browser_instructions'):
        experiences = f"**Some experiences that might be userful:**\n{'\n'.join(state.get('instruction_state', {}).get('browser_instructions', []))}"
    else:
        experiences = ""

    def _get_url_list(url_chunk: List[SearchResult]):
        structured_llm = llm.with_structured_output(UrlSelection)
        formatted_prompt = url_selection_prompt.format(original_question=get_user_question(state['messages']),
                                                      sub_question=state.get('current_sub_question', ''),
                                                    #   current_summary=state['current_summary'],
                                                      list_of_urls_and_snippets=json.dumps([result.dict() for result in url_chunk], indent=4),
                                                      current_date=get_current_date(),
                                                      experiences=experiences)
        result = structured_llm.invoke(formatted_prompt)
        try:
            return result.selected_urls
        except:
            return []

    def _extract_information(webpage_content_parts: List[str]):
        structured_llm = llm.with_structured_output(ExtractInformation)
        information_list = []
        should_continue = True
        for i, webpage_content_part in enumerate(webpage_content_parts, 1):
            logger.info(f"📄 Processing part {i}/{len(webpage_content_parts)}")
            webpage_content_part = "Part " + str(i) + "/" + str(len(webpage_content_parts)) + ":\n" + webpage_content_part.strip()
            formatted_prompt = extract_information_prompt.format(webpage_content=webpage_content_part,
                                                                original_question=get_user_question(state['messages']),
                                                                sub_question=state.get('current_sub_question', ''),
                                                                current_date=get_current_date())
            result = structured_llm.invoke(formatted_prompt)
            try:
                # Extend instead of append to flatten the list of lists into a single list
                information_list.extend(result.information_list)
                should_continue = result.should_continue
            except:
                continue
            if not should_continue:
                break
        return information_list

    # Get search results from the searcher state
    search_results = state.get('searcher_state', {}).get('search_results', [])
    if not search_results:
        logger.warning("No search results found in state")
        return {"browser_state": BrowserState(
            visit_count=0,
            visited_urls=[],
            found_references=[],
            visit_cache={}
        )}
    
    logger.info(f"📊 Processing {len(search_results)} search results")
    
    # Split the search results into chunks of 10 results each
    chunk_size = 10
    search_result_chunks = [search_results[i:i + chunk_size] for i in range(0, len(search_results), chunk_size)]
    logger.info(f"📦 Split into {len(search_result_chunks)} chunks")
    
    # Select URLs from each chunk and collect them together
    all_selected_urls = []
    for i, chunk in enumerate(search_result_chunks, 1):
        logger.info(f"🔍 Selecting URLs from chunk {i}/{len(search_result_chunks)}")
        selected_urls = _get_url_list(chunk)
        all_selected_urls.extend(selected_urls)
        logger.info(f"✅ Selected {len(selected_urls)} URLs from chunk {i}")
    
    logger.info(f"🌐 Total URLs selected for browsing: {len(all_selected_urls)}")
    
    # Get browser cache (using correct field name)
    visit_cache = state.get('browser_state', {}).get('visit_cache', {})
    visited_urls = state.get('browser_state', {}).get('visited_urls', [])
    cache_lock = threading.Lock()
    
    def _process_single_url(url: str):
        """Process a single URL: visit, split content, and extract information"""
        try:
            # Check cache first (thread-safe)
            with cache_lock:
                if url in visit_cache:
                    logger.info(f"📋 Cache hit for URL: {url}")
                    webpage_content = visit_cache[url]
                else:
                    webpage_content = None
            
            # If not in cache, visit the URL
            if webpage_content is None:
                logger.info(f"🌐 Visiting URL: {url}")
                webpage_content = visit(url, JINA_API_KEY)
                
                # Update cache and visited URLs (thread-safe)
                with cache_lock:
                    visit_cache[url] = webpage_content
                    if url not in visited_urls:
                        visited_urls.append(url)
            
            # Split webpage content into parts
            webpage_content_parts = split_webpage_content(webpage_content, max_length=5000)
            logger.info(f"📄 Split {url} into {len(webpage_content_parts)} parts")
            
            # Extract information from all parts
            information_list = _extract_information(webpage_content_parts)
            logger.info(f"📝 Extracted {len(information_list)} pieces of information from {url}")
            
            return url, information_list
            
        except Exception as exc:
            logger.error(f"❌ Error processing URL {url}: {exc}")
            return url, []
    
    # Visit URLs and extract information in multiple threads
    max_workers = min(5, len(all_selected_urls))  # Limit concurrent requests to avoid overwhelming servers
    all_references = []
    visit_count = 0
    
    if all_selected_urls:
        with ThreadPoolExecutor(max_workers=max_workers) as executor:
            # Submit all URL processing tasks
            future_to_url = {
                executor.submit(_process_single_url, url): url 
                for url in all_selected_urls
            }
            
            # Collect results as they complete
            for future in as_completed(future_to_url):
                url = future_to_url[future]
                try:
                    processed_url, information_list = future.result()
                    
                    # Create Reference object if we have information
                    if information_list:
                        reference = Reference(
                            url=processed_url,
                            information_list=information_list
                        )
                        all_references.append(reference)
                        logger.info(f"📝 Created reference for {processed_url} with {len(information_list)} pieces of information")
                    
                    visit_count += 1
                    logger.info(f"✅ Completed processing URL: {processed_url}")
                except Exception as exc:
                    logger.error(f"❌ URL '{url}' generated an exception: {exc}")
    
    logger.info(f"🎯 Total references created: {len(all_references)}")
    
    # Return the Browser State
    browser_state = BrowserState(
        visit_count=visit_count,
        visited_urls=all_selected_urls,
        found_references=all_references,
        visit_cache=visit_cache
    )
    
    logger.info("🎉 Advanced browser process completed!")
    return {"browser_state": browser_state}

def deep_browser(state: OverallState, config: RunnableConfig) -> OverallState:
    """
    This is a deep browser block that visits web pages, extracts relevant information, and creates references from the collected content with parallelism and optimized limits.
    """
    logger.info("🌐 Starting optimized deep web browsing process...")
    configurable = Configuration.from_runnable_config(config)
    llm = ChatQwen(
        model=configurable.browser_model,
        api_key=DASHSCOPE_API_KEY,
    )

    if state.get('instruction_state', {}).get('browser_instructions'):
        experiences = f"**Some experiences that might be userful (or not):**\n{'\n'.join(state.get('instruction_state', {}).get('browser_instructions', []))}"
    else:
        experiences = ""
    
    # select the root urls
    def _select_root_urls():
        structured_llm = llm.with_structured_output(SelectRootUrls)
        formatted_prompt = select_root_urls_prompt.format(question=get_user_question(state['messages']),
                                                          sub_goal=state.get('current_sub_question', ''),
                                                          list_of_urls_and_snippets=json.dumps([result.dict() for result in state.get('searcher_state', {}).get('search_results', [])], indent=4),
                                                        current_date=get_current_date(),
                                                        experiences=experiences)
        while True:
            result = structured_llm.invoke(formatted_prompt)
            try:
                return result.selected_urls
            except:
                continue


    # process a single page with optimized batching
    def _extract_information_and_urls(webpage_content_parts: List[str]):
        structured_llm = llm.with_structured_output(DeepBrowse)
        information_list = []
        inner_url_list = []
        
        # Batch smaller parts together to reduce LLM calls
        if len(webpage_content_parts) <= 2:
            # Process all parts together for small content
            combined_content = "\n\n".join([f"Part {i+1}/{len(webpage_content_parts)}:\n{part.strip()}" 
                                          for i, part in enumerate(webpage_content_parts)])
            formatted_prompt = deep_browse_prompt.format(webpage_content=combined_content,
                                                        question=get_user_question(state['messages']),
                                                        sub_goal=state.get('current_sub_question', ''),
                                                        current_date=get_current_date())
            result = structured_llm.invoke(formatted_prompt)
            try:
                information_list.extend(result.information)
                inner_url_list.extend(result.inner_url_list)
            except:
                pass
        else:
            # For larger content, process first 6 parts only to save time (matching OpenAI change)
            for i in range(min(6, len(webpage_content_parts))):
                webpage_content_part = f"Part {i+1}/{len(webpage_content_parts)}:\n{webpage_content_parts[i].strip()}"
                formatted_prompt = deep_browse_prompt.format(webpage_content=webpage_content_part,
                                                            question=get_user_question(state['messages']),
                                                            sub_goal=state.get('current_sub_question', ''),
                                                            current_date=get_current_date())
                result = structured_llm.invoke(formatted_prompt)
                try:
                    information_list.extend(result.information)
                    inner_url_list.extend(result.inner_url_list)
                except:
                    continue
                
                # Stop early if we have enough information
                if len(information_list) > 5:
                    break
                    
        return information_list, inner_url_list

    visit_count = 0
    visit_cache = state.get('browser_state', {}).get('visit_cache', {})
    visited_urls = state.get('browser_state', {}).get('visited_urls', [])
    
    all_references = []
    url_to_visit_queue = []
    url_to_visit_queue.extend(_select_root_urls())
    
    # Parallel processing function for a single URL
    def _process_single_url(url_info):
        url, depth = url_info
        try:
            logger.info(f"🌐 Processing URL (depth {depth}): {url}")
            
            # Check cache first
            if url in visit_cache:
                webpage_content = visit_cache[url]
            else:
                webpage_content = visit(url, JINA_API_KEY)
                visit_cache[url] = webpage_content
            
            # Split webpage content into manageable parts (smaller chunks for faster processing)
            webpage_content_parts = split_webpage_content(webpage_content, max_length=3000)
            
            # Extract information and inner URLs
            information_list, inner_url_list = _extract_information_and_urls(webpage_content_parts)
            
            # Create Reference object if we have information
            reference = None
            if information_list:
                reference = Reference(
                    url=url,
                    information_list=information_list
                )
            
            return {
                'url': url,
                'depth': depth,
                'reference': reference,
                'inner_urls': inner_url_list[:max_urls_per_depth],  # Limit inner URLs
                'success': True
            }
        except Exception as exc:
            logger.error(f"❌ Error processing URL {url}: {exc}")
            return {
                'url': url,
                'depth': depth,
                'reference': None,
                'inner_urls': [],
                'success': False
            }
    
    # Track depth for each URL to prevent infinite recursion
    url_depth = {}
    max_depth = 3  # Reduced depth limit for better performance
    max_total_visits = min(configurable.max_visit_count, 20)  # Cap at 20 visits for deep browser
    max_urls_per_depth = 5  # Limit URLs added per page to prevent explosion
    batch_size = 4  # Process URLs in parallel batches
    
    logger.info(f"🚀 Starting optimized deep browse with {len(url_to_visit_queue)} root URLs (max {max_total_visits} visits, depth {max_depth}, parallel batches of {batch_size})")
    
    # Process URLs in parallel batches until empty or limits reached
    while url_to_visit_queue and visit_count < max_total_visits:
        # Prepare batch of URLs to process in parallel
        current_batch = []
        visited_urls_set = set(visited_urls)
        
        # Collect URLs for current batch
        while url_to_visit_queue and len(current_batch) < batch_size and visit_count + len(current_batch) < max_total_visits:
            current_url = url_to_visit_queue.pop(0)
            current_depth = url_depth.get(current_url, 0)
            
            # Skip if URL already visited or depth exceeded
            if current_url not in visited_urls_set and current_depth <= max_depth:
                current_batch.append((current_url, current_depth))
                url_depth[current_url] = current_depth
        
        if not current_batch:
            break
            
        logger.info(f"🔄 Processing batch of {len(current_batch)} URLs in parallel...")
        
        # Process batch in parallel using ThreadPoolExecutor
        batch_results = []
        with ThreadPoolExecutor(max_workers=min(4, len(current_batch))) as executor:
            future_to_url = {executor.submit(_process_single_url, url_info): url_info for url_info in current_batch}
            
            for future in as_completed(future_to_url):
                url_info = future_to_url[future]
                try:
                    result = future.result()
                    batch_results.append(result)
                except Exception as exc:
                    logger.error(f"❌ Batch processing error for {url_info[0]}: {exc}")
                    batch_results.append({
                        'url': url_info[0],
                        'depth': url_info[1],
                        'reference': None,
                        'inner_urls': [],
                        'success': False
                    })
        
        # Process batch results
        for result in batch_results:
            url = result['url']
            depth = result['depth']
            
            # Add reference if successful
            if result['reference']:
                all_references.append(result['reference'])
                logger.info(f"📝 Added reference for {url} with {len(result['reference'].information_list)} pieces of information")
            
            # Add inner URLs to queue if within depth limit
            if depth < max_depth and len(url_to_visit_queue) < 50:  # Limit queue size
                queue_urls_set = set(url_to_visit_queue)
                new_urls_added = 0
                
                for inner_url in result['inner_urls']:
                    if inner_url not in visited_urls_set and inner_url not in queue_urls_set:
                        url_to_visit_queue.append(inner_url)
                        url_depth[inner_url] = depth + 1
                        new_urls_added += 1
                
                if new_urls_added > 0:
                    logger.info(f"🔗 Added {new_urls_added} new URLs from {url} to queue")
            
            # Track as visited
            visited_urls.append(url)
            visit_count += 1
        
        logger.info(f"✅ Completed batch processing. Total visits: {visit_count}/{max_total_visits}, Queue size: {len(url_to_visit_queue)}")
    
    logger.info(f"🎯 Deep browsing completed. Processed {visit_count} URLs, created {len(all_references)} references")
    
    # Create and return the Browser State
    browser_state = BrowserState(
        visit_count=visit_count,
        visited_urls=visited_urls,
        found_references=all_references,
        visit_cache=visit_cache
    )
    
    logger.info("🎉 Deep browser process completed!")
    return {"browser_state": browser_state}

def advanced_summarizer(state: OverallState, config: RunnableConfig) -> OverallState:
    """
    This is an advanced summarizer block that summarizes the collected information from the browser state.
    """
    logger.info("🌐 Starting advanced summarizer process...")
    configurable = Configuration.from_runnable_config(config)
    llm = ChatQwen(
        model=configurable.summarizer_model,
        api_key=DASHSCOPE_API_KEY,
    )
    
    # combine all information into one list
    found_references = state.get('browser_state', {}).get('found_references', [])
    information_list = []
    for reference in found_references:
        information_list.extend(reference.information_list)

    logger.info(f"📚 Found {len(information_list)} pieces of information from {len(found_references)} references")
    
    # Handle edge case: no information found
    if not information_list:
        logger.warning("⚠️ No information found in browser state, returning empty summary")
        return {"current_summary": "No information was found during the browsing process."}

    # shuffle the information list
    random.shuffle(information_list)

    # split the information list into chunks of 10
    chunk_size = 10
    information_chunks = [information_list[i:i + chunk_size] for i in range(0, len(information_list), chunk_size)]
    
    logger.info(f"📊 Split {len(information_list)} pieces of information into {len(information_chunks)} chunks")
    
    # for each chunk, summarize the information, add to the summary list
    summaries = []
    
    for i, chunk in enumerate(information_chunks):
        logger.info(f"📝 Summarizing chunk {i+1}/{len(information_chunks)} with {len(chunk)} items")       
        # Format the information for the prompt
        formatted_info = "\n".join([f"- {info}" for info in chunk])
        
        # Create the summarize prompt
        prompt = summarize_prompt.format(
            question=get_user_question(state['messages']),
            sub_goal=state.get('current_sub_question', ''),
            list_of_information=formatted_info,
            current_date=get_current_date()
        )
        
        # Get summary from LLM
        try:
            summary_response = llm.with_structured_output(Summarizer).invoke([{"role": "user", "content": prompt}])
            summaries.append(summary_response.summary)
        except Exception as e:
            logger.error(f"❌ Error summarizing chunk {i+1}: {str(e)}")
            # Fallback: create a simple concatenated summary
            fallback_summary = f"Information from chunk {i+1}: " + "; ".join(chunk[:5])  # Take first 5 items
            summaries.append(fallback_summary)
        
        logger.info(f"✅ Completed summary for chunk {i+1}")
    
    # ensemble the summaries
    logger.info(f"🔄 Ensembling {len(summaries)} summaries into final summary")
    
    if len(summaries) == 1:
        final_summary = summaries[0]
        logger.info("📋 Only one summary, using it as final summary")
    else:
        # Format summaries for ensemble prompt
        formatted_summaries = "\n\n".join([f"Summary {i+1}:\n{summary}" for i, summary in enumerate(summaries)])
        
        # Create the ensemble prompt
        ensemble_prompt_text = ensemble_prompt.format(
            question=get_user_question(state['messages']),
            sub_goal=state.get('current_sub_question', ''),
            several_summaries=formatted_summaries,
            current_date=get_current_date(),
            current_summary=state.get('current_summary', '')
        )
        
        # Get final ensemble summary from LLM
        try:
            ensemble_response = llm.with_structured_output(Summarizer).invoke([{"role": "user", "content": ensemble_prompt_text}])
            final_summary = ensemble_response.summary
        except Exception as e:
            logger.error(f"❌ Error during ensemble summarization: {str(e)}")
            # Fallback: concatenate all summaries
            final_summary = "\n\n".join([f"Summary {i+1}: {summary}" for i, summary in enumerate(summaries)])
        
        logger.info("✅ Completed ensemble summarization")
    
    logger.info("🎉 Advanced summarizer process completed!")
    
    return {"current_summary": final_summary}

def next_sub_question_writer_with_information_gain(state: OverallState, config: RunnableConfig) -> OverallState:
    """
    This is a general next sub-question multi-writer block that first generates a set of sub-questions from different perspectives when the current summary is insufficient to answer the main question, then sorts the sub-question sets to maximum the Information Gain, and finally add it with verification conditions.
    """
    logger.info("❓ Generating next mult sub-question...")
    configurable = Configuration.from_runnable_config(config)
    llm = ChatQwen(model=configurable.next_sub_question_writer_model, api_key=DASHSCOPE_API_KEY)
    structured_llm_writer = llm.with_structured_output(NextSubQuestionMultiWriter)
    formatted_prompt = next_sub_question_multi_writer_prompt.format(question=get_user_question(state['messages']),
                                                    current_summary=state.get('current_summary', ''),
                                                    current_date=get_current_date(),
                                                    max_questions = MAX_Q)
    sub_question_sets = structured_llm_writer.invoke(formatted_prompt)
    logger.info(f"❓ New sub-question sets generated: {sub_question_sets.new_sub_question_set}")
    
    logger.info("❓ Sorting the sub-question sets to  maximum the Information Gain...")
    llm = ChatQwen(model=configurable.next_sub_question_writer_model, api_key=DASHSCOPE_API_KEY)
    structured_llm_sorter = llm.with_structured_output(NextSubQuestionChooser)
    formatted_prompt = next_sub_question_sorting_prompt.format(question=get_user_question(state['messages']),
                                                    current_summary=state.get('current_summary', ''),
                                                    sub_question_sets = sub_question_sets.new_sub_question_set,
                                                    current_date=get_current_date())
    result = structured_llm_sorter.invoke(formatted_prompt)
    logger.info(f"❓ New sub-question generated: {result.new_sub_question}")

    return {"current_sub_question": result.new_sub_question, "current_sub_question_iteration": 1}