import os
import argparse
import logging
import json
import glob
import shutil
import threading
import concurrent.futures
from typing import List, Dict, Any
from pathlib import Path

from agents import (
    PlannerAgent,
    RTLAgent,
    MergeAgent,
    SyntaxDebugAgent,
    SemanticDebugAgent,
    SectionSelectorAgent,
)
from utils import setup_logging, read_jsonl, save_output
from agents.backends import create_llm_client
from verification import VerilogVerifier

def run_agent_with_retry(agent, agent_name: str, inputs: Dict[str, Any], task_name: str, max_retries: int = 2) -> Dict[str, Any]:
    """Run agent with retry mechanism for specified agents
    
    Args:
        max_retries: Maximum number of attempts (e.g., max_retries=3 means run at most 3 times)
    """
    for attempt_num in range(1, max_retries + 1):
        try:
            if attempt_num > 1:
                console_print(task_name, agent_name.upper(), "warning", f"Retry attempt {attempt_num}/{max_retries}")
                agent.logger.warning(f"Retry attempt {attempt_num}/{max_retries}")
            inputs["task_name"] = task_name
            result = agent.run(inputs)
            
            if attempt_num > 1:
                console_print(task_name, agent_name.upper(), "success", f"Succeeded on attempt {attempt_num}")
                agent.logger.info(f"Succeeded on attempt {attempt_num}")
            
            return result
            
        except Exception as e:
            if attempt_num < max_retries:
                console_print(task_name, agent_name.upper(), "error", f"Attempt {attempt_num} failed: {str(e)[:100]}...")
                agent.logger.error(f"Attempt {attempt_num} failed: {e}")
                continue
            else:
                console_print(task_name, agent_name.upper(), "error", f"All {max_retries} attempts failed")
                agent.logger.error(f"All {max_retries} attempts failed. Final error: {e}")
                raise e

def assemble_document_from_sections(section_dict: Dict[str, str], section_ids: List[str], summary_dict: Dict[str, Any] = None) -> str:
    """
    Universal document assembly function that assembles documents based on selector-provided indices
    
    Args:
        section_dict: Complete document section dictionary
        section_ids: List of section IDs selected by selector
        summary_dict: Optional summary dictionary containing title and summary for each section
    
    Returns:
        Assembled document content with enhanced section information
    """
    if not section_ids:
        return ""
    
    selected_sections = []
    for section_id in section_ids:
        if section_id in section_dict:
            # Build enhanced section with title, summary and content
            section_header = f"=== Section {section_id} ==="
            
            # Add title if available
            if summary_dict and section_id in summary_dict:
                title = summary_dict[section_id].get('title', 'Unknown Title')
                section_header += f"\nTitle: {title}"
                
                # Add summary directly from loaded JSON
                section_data = summary_dict[section_id]
                summary_lines = []
                if 'high_level_summary' in section_data:
                    summary_lines.append(f"High-level: {section_data['high_level_summary']}")
                if 'low_level_summary' in section_data:
                    summary_lines.append(f"Low-level: {section_data['low_level_summary']}")
                summary = "\n".join(summary_lines) if summary_lines else 'No summary available'
                section_header += f"\nSummary: {summary}"
            
            section_header += "\nContent:"
            
            # Combine header with actual section content
            enhanced_section = f"{section_header}\n{section_dict[section_id]}"
            selected_sections.append(enhanced_section)
    
    return "\n\n" + "="*80 + "\n\n".join(selected_sections) + "\n" + "="*80 + "\n"

def request_document_selection(section_selector_agent, task_type: str, summary_dict: Dict[str, Any],
                             task_name: str, logger, **kwargs) -> List[str]:
    """
    Request document indexing from SectionSelectorAgent
    
    Args:
        section_selector_agent: SectionSelectorAgent instance
        task_type: Task type ("syntax_debug", "semantic_debug", "merge")
        summary_dict: Document section summary dictionary
        task_name: Task name
        logger: Logger instance
        **kwargs: Task-specific additional parameters
    
    Returns:
        List of selected section IDs
    """
    logger.info(f"Requesting document selection for {task_type}")
    
    try:
        # Build selector input
        selector_input = {
            "task_type": task_type,
            "summary_dict": summary_dict
        }
        
        # Add task-specific parameters
        if task_type in ["syntax_debug", "semantic_debug"]:
            selector_input["error_messages"] = kwargs.get("error_messages", "")
            selector_input["current_code"] = kwargs.get("current_code", "")
        elif task_type == "merge":
            selector_input["subproblems"] = kwargs.get("subproblems", [])
            selector_input["subproblem_code_fragments"] = kwargs.get("subproblem_code_fragments", [])
        
        # Call selector agent
        selection_result = run_agent_with_retry(
            section_selector_agent, "section_selector", selector_input, task_name, max_retries=2
        )
        
        relevant_sections = selection_result.get("relevant_section_ids", [])
        logger.info(f"Selected {len(relevant_sections)} sections for {task_type}: {relevant_sections}")
        return relevant_sections
        
    except Exception as e:
        logger.warning(f"Document selection failed for {task_type}: {e}, using no context")
        return []

def run_debug_with_iterations(syntax_debug_agent, semantic_debug_agent, section_selector_agent, verifier, code: str, task_name: str, 
                             verification_path: str, summary_dict: Dict[str, Any], section_dict: Dict[str, str], 
                             output_dir: str, max_iterations: int = 3) -> Dict[str, Any]:
    """Run debug process with separate syntax and semantic agents"""
    
    console_print(task_name, "DEBUG", "start")
    syntax_debug_agent.logger.info("Starting debug process with syntax/semantic separation")
    
    current_code = code
    debug_applied = False
    
    for iteration_num in range(1, max_iterations + 1):
        syntax_debug_agent.logger.info(f"Debug iteration {iteration_num}/{max_iterations}")
        
        # Run verification to check current code
        verification_result = verifier.verify_code(current_code, str(task_name), verification_path)
        syntax_debug_agent.logger.info(f"Verification result: syntax={verification_result['syntax']}, semantic={verification_result['semantic']}")
        
        # Check if code passes all tests
        if verification_result["syntax"] == 1 and verification_result["semantic"] == 1:
            syntax_debug_agent.logger.info("✅ Code verification passed!")
            if iteration_num == 1:
                console_print(task_name, "DEBUG", "success", f"✓ Passed without debug (initial verification)")
                debug_iterations_used = 0
            else:
                console_print(task_name, "DEBUG", "success", f"✓ Passed after {iteration_num - 1} debug iterations")
                debug_iterations_used = iteration_num - 1
            
            return {
                "success": True,
                "final_code": current_code,
                "iterations": debug_iterations_used,
                "debug_applied": debug_applied,
                "verification_result": verification_result
            }
        
        # Verification failed - apply debug fixes
        debug_applied = True
        
        # Separate syntax and semantic errors
        has_syntax_errors = verification_result.get("syntax", 1) == 0
        has_semantic_errors = verification_result.get("semantic", 1) == 0
        
        syntax_errors = verification_result.get("syntax_err", "") if has_syntax_errors else ""
        semantic_errors = verification_result.get("semantic_err", "") if has_semantic_errors else ""
        
        try:
            # Stage 1: Fix syntax errors first (if any)
            if has_syntax_errors:
                console_print(task_name, "SYNTAX_DEBUG", "start", f"Iteration {iteration_num}")
                
                # Request document selection
                relevant_section_ids = request_document_selection(
                    section_selector_agent, "syntax_debug", summary_dict, task_name, 
                    syntax_debug_agent.logger, error_messages=syntax_errors, current_code=current_code
                )
                
                # Assemble document
                document_fragments = assemble_document_from_sections(section_dict, relevant_section_ids, summary_dict)
                
                syntax_debug_input = {
                    "error_code": current_code,
                    "error_messages": syntax_errors,
                    "document_fragments": document_fragments,
                    "task_name": task_name
                }
                
                syntax_result = run_agent_with_retry(syntax_debug_agent, "syntax_debug", syntax_debug_input, task_name, max_retries=2)
                save_agent_log(output_dir, task_name, f"syntax_debug_{iteration_num}", syntax_debug_input, syntax_result)
                
                if syntax_result["success"]:
                    current_code = syntax_result["fixed_code"]
                    console_print(task_name, "SYNTAX_DEBUG", "success", f"Applied {len(syntax_result.get('fix_operations', []))} fixes")
                    syntax_debug_agent.logger.info(f"✅ Syntax debug applied fixes in iteration {iteration_num}")
                else:
                    console_print(task_name, "SYNTAX_DEBUG", "warning", "No fixes applied")
                    syntax_debug_agent.logger.warning(f"⚠️ Syntax debug failed in iteration {iteration_num}")
            
            # Stage 2: Fix semantic errors (if any and no syntax errors remain)
            elif has_semantic_errors:  # Only run semantic debug if syntax is clean
                console_print(task_name, "SEMANTIC_DEBUG", "start", f"Iteration {iteration_num}")
                
                # Request document selection
                relevant_section_ids = request_document_selection(
                    section_selector_agent, "semantic_debug", summary_dict, task_name,
                    semantic_debug_agent.logger, error_messages=semantic_errors, current_code=current_code
                )
                
                # Assemble document
                document_fragments = assemble_document_from_sections(section_dict, relevant_section_ids, summary_dict)
                
                semantic_debug_input = {
                    "error_code": current_code,
                    "error_messages": semantic_errors,
                    "document_fragments": document_fragments,
                    "task_name": task_name
                }
                
                semantic_result = run_agent_with_retry(semantic_debug_agent, "semantic_debug", semantic_debug_input, task_name, max_retries=2)
                save_agent_log(output_dir, task_name, f"semantic_debug_{iteration_num}", semantic_debug_input, semantic_result)
                
                if semantic_result["success"]:
                    current_code = semantic_result["fixed_code"]
                    console_print(task_name, "SEMANTIC_DEBUG", "success", f"Applied {len(semantic_result.get('fix_operations', []))} fixes")
                    semantic_debug_agent.logger.info(f"✅ Semantic debug applied fixes in iteration {iteration_num}")
                else:
                    console_print(task_name, "SEMANTIC_DEBUG", "warning", "No fixes applied")
                    semantic_debug_agent.logger.warning(f"⚠️ Semantic debug failed in iteration {iteration_num}")
                
        except Exception as e:
            syntax_debug_agent.logger.error(f"❌ Debug process failed with exception in iteration {iteration_num}: {e}")
            # Continue with current code for next iteration
    
    # Reached max iterations without success
    final_verification = verifier.verify_code(current_code, str(task_name), verification_path)
    final_success = final_verification["syntax"] == 1 and final_verification["semantic"] == 1
    
    if final_success:
        console_print(task_name, "DEBUG", "success", f"✓ Fixed after {max_iterations} iterations")
        syntax_debug_agent.logger.info("✅ Final verification passed after max iterations!")
    else:
        console_print(task_name, "DEBUG", "error", f"Failed after {max_iterations} iterations")
        syntax_debug_agent.logger.error("❌ Final verification failed after max iterations")
    
    return {
        "success": final_success,
        "final_code": current_code,
        "iterations": max_iterations,  # Used all available iterations
        "debug_applied": debug_applied,
        "verification_result": final_verification
    }

def parse_args() -> argparse.Namespace:
    parser = argparse.ArgumentParser(description="Complex Verilog Agent Pipeline")
    parser.add_argument("--input", nargs='+',
                       help="JSONL file path(s) containing problem text and optional id. Can specify multiple files.")
    parser.add_argument("--provider", choices=["anthropic", "openai", "vllm", "deepseek"], default="anthropic",
                       help="LLM provider type")
    parser.add_argument("--model", help="Model name")
    parser.add_argument("--temperature", type=float, default=0.6)
    parser.add_argument("--max_tokens", type=int, default=131072, help="Maximum generation tokens")
    parser.add_argument("--output_dir", default="./outputs", help="Output directory")
    parser.add_argument("--preprocess_dir", default="./preprocessed", help="Directory to load preprocessed summaries/sections if available")
    parser.add_argument(
        "--tokenizer_path",
        help="Optional tokenizer path for local models",
    )
    
    # Agent disable options
    # parser.add_argument("--disable_summarize", default=True, action="store_true", help="Disable summarize agent")
    parser.add_argument("--disable_planner", action="store_true", help="Disable planner agent")
    parser.add_argument("--disable_rtl", action="store_true", help="Disable RTL agent")
    parser.add_argument("--disable_merge", action="store_true", help="Disable merge agent")
    parser.add_argument("--disable_debug", action="store_true", help="Disable debug agent")
    
    parser.add_argument("--verification_dir", help="Verification files directory")
    parser.add_argument("--max_debug_iterations", type=int, default=10, help="Maximum debug iterations")
    
    # Multi-threading parameters
    parser.add_argument("--max_workers", type=int, default=8, help="Maximum number of worker threads")

    return parser.parse_args()

def create_agent_logger(task_name: str, agent_name: str, output_dir: str) -> logging.Logger:
    """Create detailed logger for each agent"""
    log_dir = os.path.join(output_dir, str(task_name), "logs")
    os.makedirs(log_dir, exist_ok=True)
    
    log_file = os.path.join(log_dir, f"{agent_name}.log")
    
    # Create logger
    logger = logging.getLogger(f"{task_name}_{agent_name}")
    logger.setLevel(logging.DEBUG)
    
    # Clear existing handlers
    for handler in logger.handlers[:]:
        logger.removeHandler(handler)
    
    # File handler for detailed logs
    file_handler = logging.FileHandler(log_file, mode='w')
    file_handler.setLevel(logging.DEBUG)
    file_formatter = logging.Formatter(
        '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
    )
    file_handler.setFormatter(file_formatter)
    logger.addHandler(file_handler)
    
    return logger

def save_agent_log(output_dir: str, task_name: str, agent_name: str, input_data: Dict[str, Any], output_data: Dict[str, Any]):
    """Save agent input and output for logging and replay capability"""
    log_dir = os.path.join(output_dir, str(task_name), "agent_logs")
    os.makedirs(log_dir, exist_ok=True)
    
    # Save input
    input_file = os.path.join(log_dir, f"{agent_name}_input.json")
    save_output(input_file, json.dumps(input_data, indent=2, ensure_ascii=False))
    
    # Save output
    output_file = os.path.join(log_dir, f"{agent_name}_output.json")
    save_output(output_file, json.dumps(output_data, indent=2, ensure_ascii=False))

def load_agent_log(output_dir: str, task_name: str, agent_name: str, log_type: str) -> Dict[str, Any]:
    """Load agent input or output from previous runs"""
    log_dir = os.path.join(output_dir, str(task_name), "agent_logs")
    log_file = os.path.join(log_dir, f"{agent_name}_{log_type}.json")
    
    if os.path.exists(log_file):
        with open(log_file, 'r', encoding='utf-8') as f:
            return json.load(f)
    else:
        raise FileNotFoundError(f"Log file not found: {log_file}")

def console_print(task_name: str, stage: str, status: str, message: str = ""):
    """Smart console output for progress tracking"""
    # Only use green checkmark for test verification passed, use plain symbols for other successes
    if status == "success":
        # Check if this is a test verification passed situation
        if ("passed" in message.lower() or 
            stage in ["DEBUG", "VERIFICATION", "PERFECT", "SYNTAX_OK", "QUALITY_CHECK"] or
            "✓" in message or "verification passed" in message or "test passed" in message):
            symbol = "✅"
        else:
            # Use plain symbols for general success
            symbol = "◉"
    else:
        symbols = {"start": "◦", "error": "❌", "warning": "⚠️"}
        symbol = symbols.get(status, "ℹ️")
    
    print(f"[{task_name}] {stage}: {symbol}{' ' + message if message else ''}")

def load_all_problems(input_paths: List[str]) -> List[Dict[str, Any]]:
    """Load problems from multiple JSONL files"""
    all_problems = []
    
    for input_path in input_paths:
        file_paths = glob.glob(input_path) if '*' in input_path else [input_path]
        
        for file_path in file_paths:
            if os.path.exists(file_path):
                console_print("SYSTEM", "LOAD", "start", f"Loading {file_path}")
                problems = read_jsonl(file_path)
                console_print("SYSTEM", "LOAD", "success", f"Found {len(problems)} problems")
                all_problems.extend(problems)
            else:
                console_print("SYSTEM", "LOAD", "error", f"File not found: {file_path}")
    # need_list = ['sdc_controller', 'e203_biu', 'e203_core', 'e203_cpu', 'e203_cpu_top', 'e203_exu', 'e203_exu_alu', 'e203_exu_decode', 'e203_ifu_ifetch', 'e203_itcm_ctrl', 'e203_lsu_ctrl']
    # all_problems = [problem for problem in all_problems if problem["task"] in need_list]
    return all_problems

def create_agents(llm_client, task_name: str, output_dir: str):
    """Create all agents with individual loggers"""
    return {
        "planner": PlannerAgent(llm_client, create_agent_logger(task_name, "planner", output_dir)),
        "rtl": RTLAgent(llm_client, create_agent_logger(task_name, "rtl", output_dir)),
        "merge": MergeAgent(llm_client, create_agent_logger(task_name, "merge", output_dir)),
        "syntax_debug": SyntaxDebugAgent(llm_client, create_agent_logger(task_name, "syntax_debug", output_dir)),
        "semantic_debug": SemanticDebugAgent(
            llm_client,
            create_agent_logger(task_name, "semantic_debug", output_dir),
            output_dir=output_dir,
        ),
        "section_selector": SectionSelectorAgent(
            llm_client,
            create_agent_logger(task_name, "section_selector", output_dir),
            output_dir=output_dir,
        ),
    }

def determine_system_name(task_name: str) -> str:
    """Determine system name from task name"""
    task_lower = str(task_name).lower()
    if "aes" in task_lower:
        return "aes"
    elif "e203" in task_lower:
        return "e203_hbirdv2"
    elif "sd" in task_lower or "sdc" in task_lower:
        return "sdc"
    else:
        raise ValueError(f"Unknown task name prefix: {task_name}")

def get_verification_path(verification_dir: str, task_name: str, output_dir: str) -> str:
    """Get verification path for a specific task and copy files to output directory"""
    system_name = determine_system_name(task_name)
    source_verification_path = os.path.join(verification_dir, system_name, str(task_name), "verification")
    
    if not os.path.exists(source_verification_path):
        raise FileNotFoundError(f"Verification path not found: {source_verification_path}")
    
    # Create verification directory in output directory
    task_output_dir = os.path.join(output_dir, str(task_name))
    output_verification_dir = os.path.join(task_output_dir, "verification")
    os.makedirs(output_verification_dir, exist_ok=True)
    
    # Copy verification files to output directory
    for item_name in os.listdir(source_verification_path):
        source_item_path = os.path.join(source_verification_path, item_name)
        dest_item_path = os.path.join(output_verification_dir, item_name)
        
        if os.path.isfile(source_item_path):
            shutil.copy2(source_item_path, dest_item_path)
        elif os.path.isdir(source_item_path):
            if os.path.exists(dest_item_path):
                shutil.rmtree(dest_item_path)
            shutil.copytree(source_item_path, dest_item_path)
    
    return output_verification_dir



def process_single_problem(problem: Dict[str, Any], llm_client, 
                         output_dir: str, args) -> Dict[str, Any]:
    """Process a single problem through the agent pipeline"""
    
    task_name = problem["task"]
    document = problem["problem"]
    
    console_print(task_name, "START", "start", f"Document length: {len(document)}")
    
    # Create task output directory
    task_output_dir = os.path.join(output_dir, str(task_name))
    os.makedirs(task_output_dir, exist_ok=True)
    
    # Create agents with individual loggers
    agents = create_agents(llm_client, task_name, output_dir)
    
    try:
        # Stage 1: Load preprocessed data
        console_print(task_name, "LOAD", "start")
        pre_dir = os.path.join(args.preprocess_dir, str(task_name))
        pre_section_path = os.path.join(pre_dir, "section_dict.json")
        pre_summary_path = os.path.join(pre_dir, "summary_dict.json")

        with open(pre_section_path, 'r', encoding='utf-8') as f:
            section_dict = json.load(f)
        with open(pre_summary_path, 'r', encoding='utf-8') as f:
            summary_dict = json.load(f)
        for section_id in summary_dict:
            summary_dict[section_id]["summary"] = summary_dict[section_id]["high_level_summary"] + "\nMentioned items: " + summary_dict[section_id]["low_level_summary"]
        
        console_print(task_name, "LOAD", "success", f"Loaded {len(summary_dict)} sections")
        
        # Stage 2: Planning
        console_print(task_name, "PLANNER", "start")
        
        if not args.disable_planner:
            planner_input = {"section_dict": section_dict, "summary_dict": summary_dict}
            planning_result = run_agent_with_retry(agents["planner"], "planner", planner_input, task_name, max_retries=2)
            save_agent_log(output_dir, task_name, "planner", planner_input, planning_result)
            console_print(task_name, "PLANNER", "success", f"Generated {len(planning_result['subproblems'])} subproblems")
        else:
            console_print(task_name, "PLANNER", "warning", "Skipped - loading from log")
            planning_result = load_agent_log(output_dir, task_name, "planner", "output")
        
        pseudocode = planning_result["pseudocode"]
        subproblems = planning_result["subproblems"]
        
        # Stage 3: RTL implementation for each subproblem
        console_print(task_name, "RTL", "start", f"Processing {len(subproblems)} subproblems")
        
        if not args.disable_rtl:
            subproblem_code_fragments = []
            
            for i, subproblem in enumerate(subproblems):
                agents["rtl"].logger.info(f"Processing subproblem {i+1}/{len(subproblems)}: {subproblem['id']}")
                
                # Assemble subproblem document
                subproblem_document = assemble_document_from_sections(section_dict, subproblem["required_section_indexes"], summary_dict)
                
                # Run RTL agent
                rtl_input = {
                    "pseudocode": pseudocode,
                    "subproblem_description": subproblem["description"],
                    "subproblem_document": subproblem_document
                }
                rtl_result = run_agent_with_retry(agents["rtl"], "rtl", rtl_input, task_name, max_retries=2)
                save_agent_log(output_dir, task_name, f"rtl_{i+1}", rtl_input, rtl_result)
                
                subproblem_code_fragments.append(rtl_result["code_fragment"])
                
                # Save subproblem result
                save_output(os.path.join(task_output_dir, f"subproblem_{i+1}.v"), 
                           rtl_result["code_fragment"])
            
            console_print(task_name, "RTL", "success")
        else:
            console_print(task_name, "RTL", "warning", "Skipped - loading from log")
            subproblem_code_fragments = []
            for i in range(len(subproblems)):
                rtl_result = load_agent_log(output_dir, task_name, f"rtl_{i+1}", "output")
                subproblem_code_fragments.append(rtl_result["code_fragment"])
        
        # Stage 4: Merge results
        console_print(task_name, "MERGE", "start")
        
        if not args.disable_merge:
            # Use selector to choose merge-related documents
            merge_section_ids = request_document_selection(
                agents["section_selector"], "merge", summary_dict, task_name,
                agents["merge"].logger, subproblems=subproblems, 
                subproblem_code_fragments=subproblem_code_fragments
            )
            
            # Assemble merge documents
            merge_document = assemble_document_from_sections(section_dict, merge_section_ids, summary_dict)
            
            merge_input = {
                "subproblems": subproblems,
                "subproblem_code_fragments": subproblem_code_fragments,
                "merge_document": merge_document
            }
            merge_result = run_agent_with_retry(agents["merge"], "merge", merge_input, task_name, max_retries=2)
            save_agent_log(output_dir, task_name, "merge", merge_input, merge_result)
            console_print(task_name, "MERGE", "success")
        else:
            console_print(task_name, "MERGE", "warning", "Skipped - loading from log")
            merge_result = load_agent_log(output_dir, task_name, "merge", "output")
        
        final_code = merge_result["final_code"]
        
        # Save merge result
        save_output(os.path.join(task_output_dir, "merged_code.v"), final_code)
        
        # Stage 5: Debug (if enabled) - with controlled iterations and verification
        debug_result = None
        if not args.disable_debug and args.verification_dir:
            try:
                # Get verification path
                verification_path = get_verification_path(args.verification_dir, task_name, output_dir)
                
                # Create verifier
                verifier = VerilogVerifier(agents["syntax_debug"].logger)
                
                # Run debug process with controlled iterations
                debug_result = run_debug_with_iterations(
                    syntax_debug_agent=agents["syntax_debug"],
                    semantic_debug_agent=agents["semantic_debug"],
                    section_selector_agent=agents["section_selector"],
                    verifier=verifier,
                    code=final_code,
                    task_name=task_name,
                    verification_path=verification_path,
                    summary_dict=summary_dict,
                    section_dict=section_dict,
                    output_dir=output_dir,
                    max_iterations=args.max_debug_iterations
                )
                
                final_code = debug_result["final_code"]
                
                # Save debug results
                save_agent_log(output_dir, task_name, "debug_final", {"initial_code": final_code}, debug_result)
                    
            except Exception as e:
                console_print(task_name, "DEBUG", "error", f"Debug process failed: {str(e)}")
                agents["syntax_debug"].logger.error(f"Debug process failed: {e}")
                debug_result = {
                    "success": False,
                    "iterations": 0,
                    "debug_applied": False,
                    "error": str(e),
                    "verification_result": {"syntax": 0, "semantic": 0, "syntax_err": str(e), "semantic_err": str(e)}
                }
        
        # Save final code
        save_output(os.path.join(task_output_dir, "final_code.v"), final_code)
        
        console_print(task_name, "COMPLETE", "success")
        
        result = {
            "task": task_name,
            "status": "success",
            "final_code": final_code,
            "output_dir": task_output_dir
        }
        
        if debug_result:
            result["debug_success"] = debug_result["success"]
            result["debug_iterations"] = debug_result.get("iterations", 0)
            result["debug_applied"] = debug_result.get("debug_applied", False)
            
            # Add verification results for statistics
            verification_result = debug_result.get("verification_result", {})
            result["syntax_passed"] = verification_result.get("syntax", 0) == 1
            result["semantic_passed"] = verification_result.get("semantic", 0) == 1
            result["both_passed"] = result["syntax_passed"] and result["semantic_passed"]
        else:
            # If debug was disabled, we don't have verification results
            result["debug_success"] = None
            result["debug_iterations"] = 0
            result["debug_applied"] = False
            result["syntax_passed"] = None
            result["semantic_passed"] = None
            result["both_passed"] = None
        
        return result
        
    except Exception as e:
        console_print(task_name, "ERROR", "error", str(e))
        return {
            "task": task_name,
            "status": "error",
            "error": str(e),
            "output_dir": task_output_dir
        }

def process_problems_multithreaded(problems: List[Dict[str, Any]], llm_client_factory, 
                                 output_dir: str, args, max_workers: int) -> List[Dict[str, Any]]:
    """Process multiple problems using multithreading"""
    results = []
    
    def worker_process(problem):
        # Create a new LLM client for each thread to avoid conflicts
        thread_llm_client = llm_client_factory()
        return process_single_problem(problem, thread_llm_client, output_dir, args)
    
    with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:
        # Submit all tasks
        future_to_problem = {
            executor.submit(worker_process, problem): problem 
            for problem in problems
        }
        
        # Collect results as they complete
        for future in concurrent.futures.as_completed(future_to_problem):
            problem = future_to_problem[future]
            try:
                result = future.result()
                results.append(result)
                console_print("SYSTEM", "PROGRESS", "success", 
                             f"Completed {problem['task']} - Status: {result['status']}")
            except Exception as e:
                console_print("SYSTEM", "PROGRESS", "error", 
                             f"Failed {problem['task']}: {str(e)}")
                results.append({
                    "task": problem["task"],
                    "status": "error",
                    "error": str(e)
                })
    
    return results

def main():
    args = parse_args()
    
    # Setup basic logging
    logger = setup_logging()
    
    console_print("SYSTEM", "START", "start", "Complex Agent Pipeline")
    console_print("SYSTEM", "CONFIG", "start", f"Model: {args.model}, Workers: {args.max_workers}")
    
    # Show enabled/disabled agents
    agents_status = []
    # if not args.disable_summarize: agents_status.append("summarize")
    if not args.disable_planner: agents_status.append("planner") 
    if not args.disable_rtl: agents_status.append("rtl")
    if not args.disable_merge: agents_status.append("merge")
    if not args.disable_debug: agents_status.append("debug")
    console_print("SYSTEM", "AGENTS", "start", f"Enabled: {', '.join(agents_status)}")
    
    # Create output directory
    os.makedirs(args.output_dir, exist_ok=True)
    
    # Create LLM client factory for multithreading
    def create_llm_client_instance():
        return create_llm_client(
            provider=args.provider,
            model=args.model,
            temperature=args.temperature,
            max_tokens=args.max_tokens,
            tokenizer_path=args.tokenizer_path,
        )
    
    # Test LLM connection
    console_print("SYSTEM", "LLM", "start", f"{args.provider}/{args.model}")
    test_client = create_llm_client_instance()
    console_print("SYSTEM", "LLM", "success")
    
    # Read problems from all input files
    problems = load_all_problems(args.input)
    console_print("SYSTEM", "LOAD", "success", f"Total: {len(problems)} problems")
    
    if not problems:
        console_print("SYSTEM", "LOAD", "error", "No problems found")
        return
    
    # Process problems with multithreading
    console_print("SYSTEM", "PROCESSING", "start", f"Using {args.max_workers} workers")
    results = process_problems_multithreaded(
        problems, create_llm_client_instance, args.output_dir, 
        args, args.max_workers
    )
    
    # Save overall results with system-specific filename
    # Determine system name from first problem
    if results and results[0].get("task"):
        try:
            system_name = determine_system_name(results[0]["task"])
            results_filename = f"{system_name}_results.json"
        except:
            results_filename = "results.json"
    else:
        results_filename = "results.json"
    
    save_output(os.path.join(args.output_dir, results_filename), 
               json.dumps(results, indent=2, ensure_ascii=False))
    
    # Print execution statistics - Three key metrics (in descending quality order)
    total_tasks = len(results)
    
    if not args.disable_debug:
        # Calculate three key metrics
        results_with_verification = [r for r in results if r.get("both_passed") is not None]
        total_verified = len(results_with_verification) if results_with_verification else total_tasks
        
        # 1. Both syntax and semantic correct (highest quality)
        both_passed = sum(1 for r in results_with_verification if r.get("both_passed", False))
        both_passed_pct = (both_passed / total_verified * 100) if total_verified > 0 else 0
        
        # 2. Syntax correct (medium quality)
        syntax_passed = sum(1 for r in results_with_verification if r.get("syntax_passed", False))
        syntax_passed_pct = (syntax_passed / total_verified * 100) if total_verified > 0 else 0
        
        # 3. Pipeline normal (basic quality)
        pipeline_success = sum(1 for r in results if r["status"] == "success")
        pipeline_success_pct = (pipeline_success / total_tasks * 100) if total_tasks > 0 else 0
        
        # Output three metrics (in descending quality order)
        console_print("SYSTEM", "FINAL_RESULTS", "success", f"=== Final Quality Assessment ===")
        console_print("SYSTEM", "PERFECT", "success", f"Both Syntax & Semantic Correct: {both_passed}/{total_verified} ({both_passed_pct:.1f}%)")
        console_print("SYSTEM", "SYNTAX_OK", "success", f"Syntax Correct:                 {syntax_passed}/{total_verified} ({syntax_passed_pct:.1f}%)")
        console_print("SYSTEM", "PIPELINE_OK", "success", f"Pipeline Normal:                {pipeline_success}/{total_tasks} ({pipeline_success_pct:.1f}%)")
        
        # Verify metric ascending relationship
        if both_passed_pct <= syntax_passed_pct <= pipeline_success_pct:
            console_print("SYSTEM", "QUALITY_CHECK", "success", "✓ Quality metrics ascending relationship correct")
        else:
            console_print("SYSTEM", "QUALITY_CHECK", "warning", "⚠ Quality metrics ascending relationship abnormal")
    else:
        # Pipeline statistics only
        pipeline_success = sum(1 for r in results if r["status"] == "success")
        pipeline_success_pct = (pipeline_success / total_tasks * 100) if total_tasks > 0 else 0
        console_print("SYSTEM", "PIPELINE_OK", "success", f"Pipeline Normal: {pipeline_success}/{total_tasks} ({pipeline_success_pct:.1f}%)")

if __name__ == "__main__":
    main() 