from __future__ import annotations

from typing import List, Callable, Dict, Tuple, Optional, Any
import numpy as np
import types
import warnings
from collections import defaultdict
from joblib import Parallel, delayed
from joblib.parallel import effective_n_jobs
from joblib.externals.loky.process_executor import TerminatedWorkerError
import concurrent.futures
import time
import threading

from ...oracle import create_cvrp_oracle
from .solver.solve_instance import solve_instance, nearest_neighbor_fallback


def prepare_exec_namespace() -> Dict[str, Any]:
    """
    Prepare a namespace for exec() that includes numpy.
    
    Returns:
        Dictionary with numpy and other standard imports
    """
    namespace = {
        '__builtins__': __builtins__,
        'numpy': np,
        'np': np,
    }
    return namespace


def evaluate_single_solver_instance(
    solver_id: int,
    generator_id: int,
    instance: Dict,
    optimal_value: Optional[float],
    weight: float,  # Weight is included in task but not used in evaluation
    time_limit: int,
    solver_module,
    max_iterations: int = 1000,
    max_stagnation: int = 10,
    random_seed: Optional[int] = None
) -> Tuple[int, int, float]:
    """
    
    Args:
        solver_id: Solver ID
        generator_id: Generator ID
        instance: CVRP instance dict with 'depot', 'customers', 'vehicle_capacity'
        optimal_value: Optimal solution cost (for gap calculation)
        weight: Weight (not used in evaluation)
        time_limit: Solver time limit (seconds)
        solver_module: Compiled solver module (with select function)
        max_iterations: Maximum iterations (if applicable, not used for step-by-step)
        max_stagnation: Maximum stagnation rounds (if applicable, not used for step-by-step)
        random_seed: Random seed for deterministic behavior (not used currently)
        
    Returns:
        (solver_id, generator_id, gap)
    """
    try:
        # Get select function from module
        if not hasattr(solver_module, 'select'):
            return solver_id, generator_id, 1e9
        
        select_func = solver_module.select
        
        # Ensure instance has distance_matrix_int for consistency
        # This is needed for both solver and oracle to use the same distance matrix
        if 'distance_matrix_int' not in instance:
            from .solver.solve_instance import instance_to_solver_inputs
            instance_to_solver_inputs(instance)
        
        # Run solver with timeout protection
        effective_time_limit = float(time_limit) if time_limit > 0 else None
        if effective_time_limit is not None:
            timeout_seconds = effective_time_limit + 10.0
            
            def run_solver():
                return solve_instance(
                    instance=instance,
                    select_func=select_func,
                    fallback_select=nearest_neighbor_fallback,
                    time_limit=effective_time_limit
                )
            
            try:
                with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                    future = executor.submit(run_solver)
                    solution_cost, route = future.result(timeout=timeout_seconds)
            except concurrent.futures.TimeoutError:
                print(f"      [CVRP Eval] Solver timeout for solver {solver_id}, generator {generator_id}", flush=True)
                return solver_id, generator_id, 1e9
            except Exception as e:
                print(f"      [CVRP Eval] Solver exception for solver {solver_id}, generator {generator_id}: {type(e).__name__}: {e}", flush=True)
                return solver_id, generator_id, 1e9
        else:
            try:
                solution_cost, route = solve_instance(
                    instance=instance,
                    select_func=select_func,
                    fallback_select=nearest_neighbor_fallback,
                    time_limit=None
                )
            except Exception as e:
                print(f"      [CVRP Eval] Solver exception (no timeout) for solver {solver_id}, generator {generator_id}: {type(e).__name__}: {e}", flush=True)
                return solver_id, generator_id, 1e9
        
        # Validate solution cost
        if not np.isfinite(solution_cost) or solution_cost < 0:
            # Get instance info for debugging
            num_customers = len(instance.get('customers', []))
            total_demand = sum(c.get('demand', 0) for c in instance.get('customers', []))
            vehicle_capacity = instance.get('vehicle_capacity', 0)
            print(f"      [CVRP Eval] Invalid solution_cost: {solution_cost} for solver {solver_id}, generator {generator_id}", flush=True)
            print(f"      [CVRP Eval] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
            return solver_id, generator_id, 1e9
        
        # Compute gap
        if optimal_value is not None and optimal_value > 0:
            if solution_cost < optimal_value:
                gap = 0.0
            else:
                gap = (solution_cost - optimal_value) / abs(optimal_value) * 100.0
        else:
            # Debug: log why gap is inf
            num_customers = len(instance.get('customers', []))
            total_demand = sum(c.get('demand', 0) for c in instance.get('customers', []))
            vehicle_capacity = instance.get('vehicle_capacity', 0)
            if optimal_value is None:
                print(f"      [CVRP Eval] optimal_value is None for solver {solver_id}, generator {generator_id}. Solution cost: {solution_cost}. Gap set to inf.", flush=True)
                print(f"      [CVRP Eval] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
                warnings.warn(
                    f"CVRP evaluation: optimal_value is None for solver {solver_id}, generator {generator_id}. "
                    f"Solution cost: {solution_cost}. Gap set to inf.",
                    UserWarning
                )
            elif optimal_value <= 0:
                print(f"      [CVRP Eval] optimal_value={optimal_value} <= 0 for solver {solver_id}, generator {generator_id}. Solution cost: {solution_cost}. Gap set to inf.", flush=True)
                print(f"      [CVRP Eval] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
                warnings.warn(
                    f"CVRP evaluation: optimal_value={optimal_value} <= 0 for solver {solver_id}, generator {generator_id}. "
                    f"Solution cost: {solution_cost}. Gap set to inf.",
                    UserWarning
                )
            gap = float('inf')
        
        return solver_id, generator_id, float(gap)
    except Exception as e:
        print(f"      [CVRP Eval] Exception in evaluate_single_solver_instance for solver {solver_id}, generator {generator_id}: {type(e).__name__}: {e}", flush=True)
        if hasattr(e, '__traceback__'):
            import traceback
            traceback.print_exc()
        return solver_id, generator_id, 1e9


def batch_evaluate_tasks(
    tasks: List[Tuple],
    evaluate_fn: Callable,
    n_jobs: int = -1,
    backend: str = "threading",
    prefer: str = "threads",
    timeout: Optional[float] = None,
    debug_mode: bool = False,
    track_time: bool = False,
    time_key: str = "solver"  # "solver" or "generator"
) -> Dict[Tuple[int, int], float]:
    """    
    Args:
        tasks: List of tasks to evaluate, each task is unpacked and passed to evaluate_fn
        evaluate_fn: Function to evaluate a single task
            Signature: fn(*task_args) -> (solver_id, generator_id, gap)
        n_jobs, backend, prefer, timeout: Parallel execution parameters
        debug_mode: Whether to print debug information
        
    Returns:
        Dictionary mapping (solver_id, generator_id) -> mean_gap (averaged over instances)
    """
    if len(tasks) == 0:
        return {}
    
    # Calculate effective workers
    workers = effective_n_jobs(n_jobs) if n_jobs > 0 else 1
    
    # Use fixed batch_size
    if backend == "loky":
        if workers > 32:
            batch_size = 1
        elif workers > 16:
            batch_size = max(1, workers // 16)
        else:
            batch_size = max(1, workers // 4)
    elif backend == "threading":
        batch_size = max(1, workers // 4)
    else:
        batch_size = max(1, workers // 2)
    
    parallel_kwargs = {
        'n_jobs': n_jobs,
        'backend': backend,
        'prefer': prefer,
        'batch_size': batch_size,
    }
    if n_jobs > 0:
        parallel_kwargs['pre_dispatch'] = max(1, n_jobs // 2)
    
    if timeout is not None and timeout > 0:
        parallel_kwargs['timeout'] = timeout
    else:
        default_timeout = len(tasks) * 60.0 / max(1, workers) * 1.5
        parallel_kwargs['timeout'] = max(default_timeout, 600.0)
        if debug_mode:
            print(f"      [BatchEval] No timeout specified, using default: {parallel_kwargs['timeout']:.1f}s", flush=True)
    
    if debug_mode:
        parallel_kwargs['verbose'] = 10
    
    if debug_mode:
        print(f"      [BatchEval] Starting evaluation: {len(tasks)} tasks, {workers} workers ({backend}/{prefer}), batch_size={batch_size}", flush=True)
    
    eval_start_time = time.time()
    
    def evaluate_with_timeout(*args, **kwargs):
        """Wrapper that adds timeout protection to each task"""
        try:
            return evaluate_fn(*args, **kwargs)
        except Exception as e:
            if len(args) >= 2:
                return args[0], args[1], 1e9
            return 0, 0, 1e9
    
    results = []
    timeout_flag = threading.Event()
    
    def timeout_monitor():
        """Monitor execution time and set timeout flag"""
        check_interval = 1.0
        while not timeout_flag.is_set():
            elapsed = time.time() - eval_start_time
            if timeout is not None and timeout > 0 and elapsed > timeout:
                timeout_flag.set()
                if debug_mode:
                    print(f"      [BatchEval] Timeout monitor triggered: {elapsed:.1f}s > {timeout:.1f}s", flush=True)
                break
            time.sleep(check_interval)
    
    monitor_thread = None
    if timeout is not None and timeout > 0:
        monitor_thread = threading.Thread(target=timeout_monitor, daemon=True)
        monitor_thread.start()
    
    try:
        with Parallel(**parallel_kwargs) as parallel_executor:
            results = parallel_executor(
                delayed(evaluate_with_timeout)(*task) for task in tasks
            )
        eval_time = time.time() - eval_start_time
        
        if timeout_flag.is_set():
            eval_time = time.time() - eval_start_time
            if debug_mode:
                print(f"      [BatchEval] WARNING: Timeout detected via monitor after {eval_time:.1f}s", flush=True)
        else:
            if debug_mode:
                print(f"      [BatchEval] Evaluation completed in {eval_time:.1f}s", flush=True)
    except (TimeoutError, concurrent.futures.TimeoutError, TerminatedWorkerError) as e:
        eval_time = time.time() - eval_start_time
        timeout_flag.set()
        if debug_mode:
            print(f"      [BatchEval] Timeout exception after {eval_time:.1f}s: {type(e).__name__}: {e}", flush=True)
        if not results:
            results = []
    except Exception as e:
        eval_time = time.time() - eval_start_time
        if debug_mode:
            print(f"      [BatchEval] Parallel evaluation failed after {eval_time:.1f}s: {e}", flush=True)
        if timeout is None or eval_time < timeout:
            try:
                results = [evaluate_fn(*task) for task in tasks]
            except Exception:
                results = []
        else:
            results = []
    
    if 'eval_time' not in locals():
        eval_time = time.time() - eval_start_time
    
    if track_time:
        try:
            from ....utils.evaluation_timer import get_timer
            timer = get_timer()
            if time_key == "solver":
                timer.add_solver_evaluation_time(eval_time)
            elif time_key == "generator":
                timer.add_generator_evaluation_time(eval_time)
        except Exception:
            pass
    
    if not results:
        if debug_mode:
            print(f"      [BatchEval] Warning: No results collected, returning empty dict", flush=True)
        return {}
    
    # Aggregate results by (solver_id, generator_id)
    results_dict = defaultdict(list)
    valid_results_count = 0
    for result in results:
        if result is None:
            continue
        try:
            solver_id, generator_id, gap = result
            if np.isfinite(gap) and gap < 1e8:
                results_dict[(solver_id, generator_id)].append(gap)
                valid_results_count += 1
            elif gap == float('inf'):
                results_dict[(solver_id, generator_id)].append(None)
                valid_results_count += 1
        except (ValueError, TypeError) as e:
            if debug_mode:
                print(f"      [BatchEval] Warning: Invalid result format: {result}, error: {e}", flush=True)
            continue
    
    if debug_mode and valid_results_count < len(tasks):
        print(f"      [BatchEval] Collected {valid_results_count}/{len(tasks)} valid results", flush=True)
    
    # Compute mean gap for each (solver_id, generator_id) pair
    mean_results = {}
    failed_pairs = []
    for (solver_id, generator_id), gaps in results_dict.items():
        if gaps:
            valid_gaps = [g for g in gaps if g is not None and np.isfinite(g) and g < 1e8]
            if valid_gaps:
                mean_gap = float(np.mean(valid_gaps))
                mean_results[(solver_id, generator_id)] = mean_gap
            else:
                # All gaps are invalid (None, inf, or >= 1e8)
                invalid_count = len([g for g in gaps if g is not None])
                inf_count = len([g for g in gaps if g == float('inf')])
                large_count = len([g for g in gaps if g is not None and g >= 1e8])
                failed_pairs.append((solver_id, generator_id, len(gaps), invalid_count, inf_count, large_count))
                mean_results[(solver_id, generator_id)] = None
    
    # Report failed evaluations
    if failed_pairs:
        print(f"      [BatchEval] WARNING: {len(failed_pairs)} (solver, generator) pairs have no valid gaps:", flush=True)
        for s_id, g_id, total, invalid, inf_cnt, large_cnt in failed_pairs:
            print(f"        (s{s_id}, g{g_id}): {total} total, {invalid} invalid, {inf_cnt} inf, {large_cnt} >=1e8", flush=True)
    
    return mean_results


def prepare_tasks(
    solver_codes: List[str],
    solver_ids: List[int],
    generator_codes: List[str],
    generator_ids: List[int],
    generator_weights: np.ndarray,
    n_instances: int,
    num_customers: int,
    vehicle_capacity: int,
    num_vehicles: Optional[int],
    time_limit: int,
    use_gap: bool,
    gap_oracle: str,
    oracle_timeout: int,
    optimal_parallel_n_jobs: Optional[int] = None,
    debug_mode: bool = False,
    cached_instances: Optional[List[List[Dict]]] = None,
    cached_oracle_costs: Optional[Dict[Tuple[int, int], float]] = None,
    config: Optional[Any] = None,
    max_iterations: int = 1000,
    max_stagnation: int = 10,
    random_seed: Optional[int] = None
) -> Tuple[List[Tuple], List[List[Dict]], Dict[Tuple[int, int], float]]:
    """
    统一的prepare_tasks函数：为所有(solver, generator)组合准备评估任务。
    
    Args:
        solver_codes: List of solver code strings
        solver_ids: List of solver IDs
        generator_codes: List of generator code strings
        generator_ids: List of generator IDs
        generator_weights: Array of weights for each generator
        n_instances: Number of instances to generate per generator
        num_customers: Number of customers
        vehicle_capacity: Vehicle capacity
        num_vehicles: Number of vehicles (optional)
        time_limit: Solver time limit (seconds)
        use_gap: Whether to compute gap (requires oracle)
        gap_oracle: Oracle type ("ortools" or "none")
        oracle_timeout: Timeout for oracle (seconds)
        optimal_parallel_n_jobs: Parallel jobs for oracle computation
        debug_mode: Whether to print debug information
        cached_instances: Cached instances (optional)
        cached_oracle_costs: Cached oracle costs (optional)
        config: Config object (optional)
        max_iterations: Maximum iterations (if applicable)
        max_stagnation: Maximum stagnation rounds (if applicable)
        
    Returns:
        Tuple of:
        - all_tasks: List of tasks
        - all_instances_by_gen: List[List[Dict]] - instances per generator (for caching)
        - optimal_costs_dict: Dict[(gen_id, inst_idx): optimal_value] - oracle costs (for caching)
    """
    prep_start_time = time.time()
    # Validate inputs
    if n_instances is None or n_instances <= 0:
        raise ValueError(f"prepare_tasks: n_instances must be a positive integer, got {n_instances}")
    if num_customers is None or num_customers <= 0:
        raise ValueError(f"prepare_tasks: num_customers must be a positive integer, got {num_customers}")
    
    n_instances = int(n_instances)
    time_limit = int(time_limit)
    num_customers = int(num_customers)
    
    prep_init_time = time.time() - prep_start_time
    if prep_init_time > 0.1:
        print(f"      [PrepareTasks] Function entry took {prep_init_time:.2f}s", flush=True)
    
    # Step 1: Generate instances from all generators
    if cached_instances is not None:
        all_instances_by_gen = cached_instances
    else:
        def generate_instances_for_single_generator(gen_id, gen_code):
            """Generate instances for a single generator"""
            try:
                with warnings.catch_warnings():
                    warnings.simplefilter("ignore")
                    gen_mod = types.ModuleType(f"generator_module_{gen_id}")
                    exec_namespace = prepare_exec_namespace()
                    exec_namespace.update(gen_mod.__dict__)
                    exec(gen_code, exec_namespace)
                    gen_mod.__dict__.update(exec_namespace)
                    
                    if not hasattr(gen_mod, "generate_instances"):
                        return []
                    
                    seeds = np.arange(n_instances, dtype=int)
                    instances = gen_mod.generate_instances(seeds, num_customers, vehicle_capacity)
                    
                    valid_instances = []
                    invalid_count = 0
                    for inst in instances:
                        if isinstance(inst, dict) and 'depot' in inst and 'customers' in inst:
                            # Validate instance
                            if len(inst['customers']) == num_customers:
                                valid_instances.append(inst)
                            else:
                                invalid_count += 1
                        else:
                            invalid_count += 1
                    
                    if invalid_count > 0:
                        print(f"      [PrepareTasks] Generator {gen_id}: {invalid_count}/{len(instances)} instances invalid (wrong format or num_customers)", flush=True)
                    return valid_instances
            except Exception as e:
                print(f"      [PrepareTasks] Generator {gen_id}: Exception generating instances: {type(e).__name__}: {e}", flush=True)
                return []
        
        # Generate instances in batches
        batch_size = 20
        n_generators = len(generator_codes)
        
        def _generate_with_id(args):
            """Wrapper for parallel execution"""
            idx, gen_id, gen_code = args
            try:
                instances = generate_instances_for_single_generator(gen_id, gen_code)
                return idx, instances
            except Exception:
                return idx, []
        
        all_instances_by_gen = [None] * n_generators
        
        if n_generators > 1:
            n_workers = min(batch_size, 16)
            n_batches = (n_generators + batch_size - 1) // batch_size
            if debug_mode:
                print(f"      [PrepareTasks] Generating instances from {n_generators} generators (in {n_batches} batches)...", flush=True)
            
            for batch_idx in range(n_batches):
                start_idx = batch_idx * batch_size
                end_idx = min(start_idx + batch_size, n_generators)
                batch_generator_ids = generator_ids[start_idx:end_idx]
                batch_generator_codes = generator_codes[start_idx:end_idx]
                
                try:
                    with Parallel(
                        n_jobs=n_workers,
                        backend="loky",
                        prefer="processes",
                        verbose=0,
                        timeout=10.0
                    ) as parallel_executor:
                        results = parallel_executor(
                            delayed(_generate_with_id)((start_idx + i, gen_id, gen_code))
                            for i, (gen_id, gen_code) in enumerate(zip(batch_generator_ids, batch_generator_codes))
                        )
                    for idx, instances in results:
                        all_instances_by_gen[idx] = instances
                except Exception:
                    for i in range(start_idx, end_idx):
                        all_instances_by_gen[i] = []
        else:
            gen_id, gen_code = generator_ids[0], generator_codes[0]
            instances = generate_instances_for_single_generator(gen_id, gen_code)
            all_instances_by_gen = [instances]
    
    # Step 2: Compute oracle (optimal value) for all instances
    all_instances_with_metadata = []
    for gen_idx, gen_id in enumerate(generator_ids):
        inst_list = all_instances_by_gen[gen_idx]
        for inst_idx, instance in enumerate(inst_list):
            all_instances_with_metadata.append((gen_id, inst_idx, instance))
    
    optimal_costs_dict = {}
    if cached_oracle_costs is not None:
        optimal_costs_dict = cached_oracle_costs
    elif use_gap and len(all_instances_with_metadata) > 0:
        try:
            oracle_n_jobs = optimal_parallel_n_jobs if (optimal_parallel_n_jobs is not None) else -1
            oracle_workers = effective_n_jobs(oracle_n_jobs)
            if debug_mode:
                print(f"      [PrepareTasks] Computing oracle for {len(all_instances_with_metadata)} instances using {oracle_workers} workers...", flush=True)
            
            def compute_single_oracle_cost(gen_id_inst_idx_instance):
                """Compute oracle cost for a single instance"""
                gen_id, inst_idx, instance = gen_id_inst_idx_instance
                try:
                    # Ensure instance has distance_matrix_int for oracle consistency
                    # This is done by instance_to_solver_inputs in solve_instance, but oracle needs it too
                    if 'distance_matrix_int' not in instance:
                        from .solver.solve_instance import instance_to_solver_inputs
                        # This will add distance_matrix_int and distance_scale to instance
                        instance_to_solver_inputs(instance)
                    
                    if config is not None:
                        oracle = create_cvrp_oracle(
                            config=config,
                            oracle_type=gap_oracle,
                        )
                    else:
                        oracle = create_cvrp_oracle(oracle_type=gap_oracle)
                    
                    result = oracle.solve_oracle(instance)
                    if result is None:
                        num_customers = len(instance.get('customers', []))
                        total_demand = sum(c.get('demand', 0) for c in instance.get('customers', []))
                        vehicle_capacity = instance.get('vehicle_capacity', 0)
                        print(f"      [PrepareTasks] Oracle returned None for generator {gen_id}, instance {inst_idx}", flush=True)
                        print(f"      [PrepareTasks] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
                        return None
                    cost = result.get("cost")
                    status = result.get("status", "UNKNOWN")
                    solver_name = result.get("solver", "unknown")
                    if cost is None:
                        num_customers = len(instance.get('customers', []))
                        total_demand = sum(c.get('demand', 0) for c in instance.get('customers', []))
                        vehicle_capacity = instance.get('vehicle_capacity', 0)
                        print(f"      [PrepareTasks] Oracle returned cost=None, status={status} for generator {gen_id}, instance {inst_idx}", flush=True)
                        print(f"      [PrepareTasks] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
                        return None
                    if not np.isfinite(cost) or cost <= 0:
                        num_customers = len(instance.get('customers', []))
                        total_demand = sum(c.get('demand', 0) for c in instance.get('customers', []))
                        vehicle_capacity = instance.get('vehicle_capacity', 0)
                        print(f"      [PrepareTasks] Oracle returned invalid cost={cost}, status={status} for generator {gen_id}, instance {inst_idx}", flush=True)
                        print(f"      [PrepareTasks] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
                        return None
                    return cost
                except Exception as e:
                    num_customers = len(instance.get('customers', []))
                    total_demand = sum(c.get('demand', 0) for c in instance.get('customers', []))
                    vehicle_capacity = instance.get('vehicle_capacity', 0)
                    print(f"      [PrepareTasks] Oracle exception for generator {gen_id}, instance {inst_idx}: {type(e).__name__}: {e}", flush=True)
                    print(f"      [PrepareTasks] Instance info: num_customers={num_customers}, total_demand={total_demand}, vehicle_capacity={vehicle_capacity}", flush=True)
                    return None
            
            oracle_start_time = time.time()
            try:
                with Parallel(
                    n_jobs=oracle_n_jobs,
                    backend="loky",
                    prefer="processes",
                    batch_size="auto",
                    verbose=10 if debug_mode else 0,
                ) as parallel_executor:
                    optimal_costs_list = parallel_executor(
                        delayed(compute_single_oracle_cost)((gen_id, inst_idx, instance))
                        for gen_id, inst_idx, instance in all_instances_with_metadata
                    )
                for (gen_id, inst_idx, _), optimal_cost in zip(all_instances_with_metadata, optimal_costs_list):
                    optimal_costs_dict[(gen_id, inst_idx)] = optimal_cost
            except Exception:
                pass
            finally:
                oracle_time = time.time() - oracle_start_time
                if debug_mode:
                    print(f"      [PrepareTasks] Oracle computation completed in {oracle_time:.1f}s", flush=True)
        except Exception:
            pass
    
    # Step 3: Pre-compile all solver modules
    solver_modules = []
    
    def compile_solver(solver_id, solver_code):
        """Compile a single solver with timeout protection"""
        def _compile():
            try:
                with warnings.catch_warnings():
                    warnings.simplefilter("ignore")
                    solver_module = types.ModuleType(f"solver_module_{solver_id}")
                    exec_namespace = prepare_exec_namespace()
                    exec_namespace.update(solver_module.__dict__)
                    exec(solver_code, exec_namespace)
                    solver_module.__dict__.update(exec_namespace)
                    return solver_module
            except Exception:
                return None
        
        try:
            with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                future = executor.submit(_compile)
                return future.result(timeout=10.0)
        except (concurrent.futures.TimeoutError, Exception):
            return None
    
    for solver_id, solver_code in zip(solver_ids, solver_codes):
        solver_modules.append(compile_solver(solver_id, solver_code))
    
    # Step 4: Generate all tasks
    # Format: (solver_id, generator_id, instance, optimal_value, weight, time_limit, solver_module, max_iterations, max_stagnation, random_seed)
    all_tasks = []
    for solver_idx, solver_id in enumerate(solver_ids):
        if solver_modules[solver_idx] is None:
            continue
        
        solver_module = solver_modules[solver_idx]
        
        # Check if select function exists
        if not hasattr(solver_module, 'select'):
            if debug_mode:
                print(f"      [PrepareTasks] Warning: Solver {solver_id} missing 'select' function, skipping", flush=True)
            continue
        
        for gen_idx, gen_id in enumerate(generator_ids):
            inst_list = all_instances_by_gen[gen_idx]
            weight = generator_weights[gen_idx] if gen_idx < len(generator_weights) else 0.0
            
            for inst_idx, instance in enumerate(inst_list):
                # Ensure instance has required fields
                if 'vehicle_capacity' not in instance:
                    instance['vehicle_capacity'] = vehicle_capacity
                if 'num_vehicles' not in instance and num_vehicles is not None:
                    instance['num_vehicles'] = num_vehicles
                
                optimal_value = optimal_costs_dict.get((gen_id, inst_idx), None)
                all_tasks.append((
                    solver_id, gen_id, instance, optimal_value, weight,
                    time_limit, solver_module, max_iterations, max_stagnation, random_seed
                ))
    
    return all_tasks, all_instances_by_gen, optimal_costs_dict




