from __future__ import annotations

from typing import List, Callable, Dict, Tuple, Optional
import numpy as np
import types
import warnings
from collections import defaultdict
from joblib import Parallel, delayed
from joblib.parallel import effective_n_jobs
from joblib.externals.loky.process_executor import TerminatedWorkerError
import concurrent.futures
import time
import threading

from .gls.gls_run import solve_instance
from .eval_utils import coords_to_matrix


def evaluate_single_solver_instance(
    solver_id: int,
    generator_id: int,
    coords: np.ndarray,
    optimal_cost: Optional[float],
    weight: float,  # Weight is included in task but not used in evaluation
    time_limit: int,
    ite_max: int,
    perturbation_moves: int,
    heuristic_module
) -> Tuple[int, int, float]:
    """
    evaluate single (solver, generator_instance) combination.
    
    this is a unified evaluation function, both solver and generator use this function.
    
    Args:
        solver_id: Solver ID
        generator_id: Generator ID
        coords: Instance coordinates
        optimal_cost: Optimal cost (for gap calculation)
        time_limit, ite_max, perturbation_moves: GLS parameters
        heuristic_module: compiled heuristic module
        
    Returns:
        Tuple[int, int, float]: (solver_id, generator_id, gap)
    """
    try:
        dis_matrix = coords_to_matrix(coords)
        opt_cost = float(optimal_cost) if (optimal_cost is not None) else np.nan
        gap = solve_instance(
            -1, opt_cost, dis_matrix, coords,
            int(time_limit), int(ite_max), int(perturbation_moves),
            heuristic_module
        )
        return solver_id, generator_id, float(gap)
    except Exception as e:
        return solver_id, generator_id, 1e9


def batch_evaluate_tasks(
    tasks: List[Tuple],
    evaluate_fn: Callable,
    n_jobs: int = -1,
    backend: str = "loky",  
    prefer: str = "processes",  
    timeout: Optional[float] = None,
    debug_mode: bool = False,
    track_time: bool = False,
    time_key: str = "solver",  # "solver" or "generator"
    task_batch_size: Optional[int] = None,
) -> Dict[Tuple[int, int], float]:
    """
    unified batch evaluation function: parallel evaluate all tasks, average by (solver_id, generator_id) and return.
    
    Args:
        tasks: List of tasks to evaluate, each task is unpacked and passed to evaluate_fn
        evaluate_fn: Function to evaluate a single task
            Signature: fn(*task_args) -> (solver_id, generator_id, gap)
        n_jobs, backend, prefer, timeout: Parallel execution parameters
        task_batch_size: Max number of tasks per internal Parallel call (None = all tasks)
        debug_mode: Whether to print debug information
        
    Returns:
        Dictionary mapping (solver_id, generator_id) -> mean_gap (averaged over instances)
    """
    if len(tasks) == 0:
        return {}
    
    parallel_kwargs = {
        'n_jobs': n_jobs,
        'backend': backend,
        'prefer': prefer,
        'batch_size': "auto",
    }
    # Only set pre_dispatch if n_jobs > 0, otherwise let joblib use default
    if n_jobs > 0:
        parallel_kwargs['pre_dispatch'] = "2*n_jobs"
    if timeout is not None:
        parallel_kwargs['timeout'] = timeout
    
    if debug_mode:
        workers = effective_n_jobs(n_jobs)
        print(f"[BatchEval] tasks={len(tasks)}, backend={backend}, n_jobs={n_jobs} -> workers={workers}")
        parallel_kwargs['verbose'] = 10
    
    # Track evaluation time if requested
    eval_start_time = time.time()
    
    # initialize CPU monitoring (for prepare task batch eval part)
    cpu_usage_percent = None
    try:
        import psutil
        # 初始化CPU percent counter（非阻塞）
        psutil.cpu_percent(interval=None)
    except Exception:
        pass
    
    # batch execute, avoid submitting large tasks at once
    effective_batch_size = (
        task_batch_size if (task_batch_size is not None and task_batch_size > 0) else len(tasks)
    )
    effective_batch_size = max(1, effective_batch_size)
    n_batches = (len(tasks) + effective_batch_size - 1) // effective_batch_size
    
    # calculate timeout for each batch
    batch_timeout = None
    if timeout is not None:
        # allocate timeout for each batch, leave some buffer
        batch_timeout = timeout / n_batches * 1.2  # allocate 20% more time for each batch as buffer
    else:
        # if no total timeout is specified, set default timeout for each batch (based on task count estimation)
        # assume each task takes at most 60 seconds
        batch_timeout = len(tasks) * 60.0 / max(1, effective_n_jobs(n_jobs)) / n_batches * 1.5
        batch_timeout = max(batch_timeout, 300.0)  # at least 5 minutes
    
    all_results = []
    try:
        for batch_idx in range(n_batches):
            start = batch_idx * effective_batch_size
            end = min(start + effective_batch_size, len(tasks))
            batch_tasks = tasks[start:end]
            
            batch_start_time = time.time()
            
            if debug_mode:
                print(f"      [BatchEval] Running task batch {batch_idx + 1}/{n_batches} (size={len(batch_tasks)}, timeout={batch_timeout:.1f}s)")
            
            batch_results = []
            batch_timeout_flag = threading.Event()
            
            def batch_timeout_monitor():
                """monitor batch timeout"""
                elapsed = time.time() - batch_start_time
                while elapsed < batch_timeout and not batch_timeout_flag.is_set():
                    time.sleep(1.0)
                    elapsed = time.time() - batch_start_time
                if elapsed >= batch_timeout and not batch_timeout_flag.is_set():
                    batch_timeout_flag.set()
                    if debug_mode:
                        print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} timeout detected after {elapsed:.1f}s", flush=True)
            
            # start timeout monitor thread
            monitor_thread = None
            if batch_timeout is not None and batch_timeout > 0:
                monitor_thread = threading.Thread(target=batch_timeout_monitor, daemon=True)
                monitor_thread.start()
            
            try:
                # set timeout parameters for batch
                batch_parallel_kwargs = parallel_kwargs.copy()
                batch_parallel_kwargs['timeout'] = batch_timeout
                
                # use ThreadPoolExecutor to wrap Parallel call, ensure forced interruption after timeout
                def run_parallel():
                    """run Parallel in separate thread, so it can be interrupted after timeout"""
                    with Parallel(**batch_parallel_kwargs) as parallel_executor:
                        return parallel_executor(
                            delayed(evaluate_fn)(*task) for task in batch_tasks
                        )
                
                # use ThreadPoolExecutor to implement forced timeout
                with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                    future = executor.submit(run_parallel)
                    try:
                        batch_results = future.result(timeout=batch_timeout)
                        batch_timeout_flag.set()  # mark completion
                    except concurrent.futures.TimeoutError:
                        # cancel task after timeout
                        batch_timeout_flag.set()
                        future.cancel()
                        # wait for a short time to let cancellation take effect
                        try:
                            concurrent.futures.wait([future], timeout=2.0)
                        except Exception:
                            pass
                        # raise timeout exception, let outer catch handle it
                        raise TimeoutError(f"Batch {batch_idx + 1} exceeded timeout {batch_timeout:.1f}s")
                
                batch_time = time.time() - batch_start_time
                if debug_mode:
                    print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} completed in {batch_time:.1f}s ({len(batch_results)} results)")
                
            except (TimeoutError, concurrent.futures.TimeoutError, TerminatedWorkerError) as e:
                batch_timeout_flag.set()
                batch_time = time.time() - batch_start_time
                if debug_mode:
                    print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} timeout after {batch_time:.1f}s: {type(e).__name__}", flush=True)
                    print(f"      [BatchEval] Skipping remaining tasks in this batch and continuing...", flush=True)
                # skip this batch after timeout, continue with next batch
                # return error results for incomplete tasks
                batch_results = []
                for task in batch_tasks:
                    # try to extract solver_id and generator_id
                    try:
                        solver_id = task[0]
                        generator_id = task[1]
                        batch_results.append((solver_id, generator_id, 1e9))  
                    except (IndexError, TypeError):
                        batch_results.append((0, 0, 1e9))
                
            except Exception as e:
                batch_timeout_flag.set()
                batch_time = time.time() - batch_start_time
                if debug_mode:
                    print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} failed after {batch_time:.1f}s: {type(e).__name__}: {e}", flush=True)
                    # only try sequential fallback if not timed out
                    if batch_time < batch_timeout:
                        print(f"      [BatchEval] Attempting sequential fallback for batch {batch_idx + 1}/{n_batches}...", flush=True)
                        try:
                            batch_results = [evaluate_fn(*task) for task in batch_tasks]
                            if debug_mode:
                                print(f"      [BatchEval] Sequential fallback succeeded for batch {batch_idx + 1}/{n_batches}", flush=True)
                        except Exception as e2:
                            if debug_mode:
                                print(f"      [BatchEval] Sequential fallback also failed: {e2}", flush=True)
                            batch_results = []
                            for task in batch_tasks:
                                try:
                                    solver_id = task[0]
                                    generator_id = task[1]
                                    batch_results.append((solver_id, generator_id, 1e9))
                                except (IndexError, TypeError):
                                    batch_results.append((0, 0, 1e9))
                    else:
                        batch_results = []
                        for task in batch_tasks:
                            try:
                                solver_id = task[0]
                                generator_id = task[1]
                                batch_results.append((solver_id, generator_id, 1e9))
                            except (IndexError, TypeError):
                                batch_results.append((0, 0, 1e9))
                else:
                    batch_results = []
                    for task in batch_tasks:
                        try:
                            solver_id = task[0]
                            generator_id = task[1]
                            batch_results.append((solver_id, generator_id, 1e9))
                        except (IndexError, TypeError):
                            batch_results.append((0, 0, 1e9))
            
            finally:
                batch_timeout_flag.set()
            
            all_results.extend(batch_results)
    finally:
        eval_time = time.time() - eval_start_time
        
        try:
            import psutil
            if eval_time > 0.1:  
                cpu_usage_percent = psutil.cpu_percent(interval=None)
                if cpu_usage_percent == 0.0 and eval_time < 1.0:
                    cpu_usage_percent = psutil.cpu_percent(interval=0.1)
        except Exception:
            cpu_usage_percent = None
        
        if track_time:
            try:
                from ...utils.evaluation_timer import get_timer
                timer = get_timer()
                if time_key == "solver":
                    timer.add_solver_time(eval_time)
                elif time_key == "generator":
                    timer.add_generator_time(eval_time)
            except Exception:
                pass  # Silently fail if timer not available
    
    import sys
    sys.modules[__name__].__dict__['_last_batch_eval_cpu_usage'] = cpu_usage_percent
    
    sums_by_pair = defaultdict(float)
    counts_by_pair = defaultdict(int)
    
    for solver_id, generator_id, gap in all_results:
        if np.isfinite(gap):
            sums_by_pair[(solver_id, generator_id)] += float(gap)
            counts_by_pair[(solver_id, generator_id)] += 1
    
    results_dict = {}
    for (solver_id, generator_id), total in sums_by_pair.items():
        cnt = counts_by_pair[(solver_id, generator_id)]
        if cnt > 0:
            results_dict[(solver_id, generator_id)] = total / cnt
        else:
            results_dict[(solver_id, generator_id)] = 1e9
    
    if debug_mode:
        print(f"      [BatchEval] Aggregated to {len(results_dict)} (solver, generator) pairs")
    
    return results_dict


def prepare_tasks(
    solver_codes: List[str],
    solver_ids: List[int],
    generator_codes: List[str],
    generator_ids: List[int],
    generator_weights: np.ndarray,
    n_instances: int,
    n_cities: int,
    time_limit: int,
    ite_max: int,
    perturbation_moves: int,
    use_gap: bool,
    gap_oracle: str,  
    oracle_timeout: int,  
    lkh_runs: Optional[int] = None,
    optimal_parallel_n_jobs: Optional[int] = None,
    debug_mode: bool = False,
    cached_instances: Optional[List[List[np.ndarray]]] = None,
    cached_oracle_costs: Optional[Dict[Tuple[int, int], float]] = None,
    lkh3_path: Optional[str] = None,
    concorde_path: Optional[str] = None
) -> List[Tuple]:
    """
    unified prepare_tasks function: prepare evaluation tasks for all (solver, generator) combinations.
     
    Args:
        solver_codes: List of solver code strings
        solver_ids: List of solver IDs (index of solver_codes)
        generator_codes: List of generator code strings
        generator_ids: List of generator IDs (index of generator_codes)
        generator_weights: Array of weights for each generator (index of generator_ids)
        n_instances: Number of instances to generate per generator
        n_cities: Number of cities in TSP instances
        time_limit, ite_max, perturbation_moves: GLS parameters
        use_gap: Whether to compute gap (requires oracle)
        gap_oracle: Oracle type ("lkh3", "concorde", "none")
        oracle_timeout: Timeout for oracle (seconds)
        lkh_runs: LKH runs (optional)
        debug_mode: Whether to print debug information
        
    Returns:
        Tuple of:
        - all_tasks: List of tasks: (solver_id, generator_id, coords, optimal_cost, weight, time_limit, ite_max, perturbation_moves, heuristic_module)
        - all_coords_by_gen: List[List[np.ndarray]] - instances per generator (for caching)
        - optimal_costs_dict: Dict[(gen_id, inst_idx): optimal_cost] - oracle costs (for caching)
    """
    # Validate and convert to int
    if n_instances is None or n_instances <= 0:
        raise ValueError(f"prepare_tasks: n_instances must be a positive integer, got {n_instances}")
    if n_cities is None or n_cities <= 0:
        raise ValueError(f"prepare_tasks: n_cities must be a positive integer, got {n_cities}")
    
    n_instances = int(n_instances)
    time_limit = int(time_limit)
    ite_max = int(ite_max)
    perturbation_moves = int(perturbation_moves)
    n_cities = int(n_cities)
    
    if debug_mode:
        print(f"[PrepareTasks] Starting: {len(solver_codes)} solvers, {len(generator_codes)} generators, {n_instances} instances/gen")
        print(f"[PrepareTasks] Parameters: time_limit={time_limit}, ite_max={ite_max}, perturbation_moves={perturbation_moves}, n_cities={n_cities}")
    
    # Step 1: batch generate all generator instances (if not provided cached instances)
    if cached_instances is not None:
        # use cached instances
        all_coords_by_gen = cached_instances
        if debug_mode:
            total_cached = sum(len(coords_list) for coords_list in cached_instances)
            print(f"[PrepareTasks] Using cached instances: {total_cached} instances from {len(cached_instances)} generators")
    else:
        # generate new instances (parallelize to improve efficiency)
        def generate_instances_for_single_generator(gen_id, gen_code):
            """generate instances for single generator"""
            try:
                with warnings.catch_warnings():
                    warnings.simplefilter("ignore")
                    gen_mod = types.ModuleType(f"generator_module_{gen_id}")
                    exec(gen_code, gen_mod.__dict__)
                    
                    if not hasattr(gen_mod, "generate_instances"):
                        if debug_mode:
                            print(f"      [PrepareTasks] ERROR: Generator {gen_id} has no generate_instances function")
                        return []
                    
                    seeds = np.arange(n_instances, dtype=int)
                    coords_list = gen_mod.generate_instances(seeds, n_cities)
                    
                    # Validate coordinates
                    valid_coords = []
                    for coords in coords_list:
                        if coords.min() >= 0 and coords.max() <= 1:
                            valid_coords.append(coords)
                        elif debug_mode:
                            print(f"      [PrepareTasks] Generator {gen_id} produced invalid coordinates")
                    return valid_coords
            except Exception as e:
                if debug_mode:
                    print(f"      [PrepareTasks] Error generating instances for generator {gen_id}: {e}")
                return []
        
        # parallel generate all generator instances
        if len(generator_codes) > 1:
            # multiple generators when parallel generate (use loky backend to support timeout, avoid blocking)
            timeout_per_generator = 10.0
            total_timeout = timeout_per_generator * len(generator_codes) + 5  # additional 5 seconds buffer
            try:
                # limit parallel degree of instance generation, avoid over-parallelization (usually generator count is not many)
                instance_gen_n_jobs = min(len(generator_codes), 8) if len(generator_codes) > 1 else 1
                all_coords_by_gen = Parallel(
                    n_jobs=instance_gen_n_jobs, 
                    backend="loky", 
                    prefer="processes",
                    timeout=total_timeout
                )(
                    delayed(generate_instances_for_single_generator)(gen_id, gen_code)
                    for gen_id, gen_code in zip(generator_ids, generator_codes)
                )
            except Exception as e:
                if debug_mode:
                    print(f"      [PrepareTasks] Parallel instance generation failed or timeout: {e}")
                    print(f"      [PrepareTasks] Falling back to sequential generation with timeout protection")
                all_coords_by_gen = []
                timeout_per_generator = 10.0
                
                for gen_id, gen_code in zip(generator_ids, generator_codes):
                    try:
                        result_container = {'result': None, 'done': False, 'exception': None}
                        
                        def run_generator():
                            try:
                                result_container['result'] = generate_instances_for_single_generator(gen_id, gen_code)
                            except Exception as e:
                                result_container['exception'] = e
                            finally:
                                result_container['done'] = True
                        
                        thread = threading.Thread(target=run_generator, daemon=True)
                        thread.start()
                        thread.join(timeout=timeout_per_generator)
                        
                        if thread.is_alive():
                            # thread is still running, timed out
                            if debug_mode:
                                print(f"      [PrepareTasks] Generator {gen_id} timeout after {timeout_per_generator}s in sequential mode")
                            all_coords_by_gen.append([])
                            # daemon thread will automatically terminate when main program exits, will not block main program
                            # thread will continue to run in background, but will not affect subsequent generator processing
                        elif result_container['done']:
                            if result_container['exception']:
                                if debug_mode:
                                    print(f"      [PrepareTasks] Generator {gen_id} failed: {result_container['exception']}")
                                all_coords_by_gen.append([])
                            else:
                                all_coords_by_gen.append(result_container['result'])
                        else:
                            # should not reach here, but return empty list for safety
                            all_coords_by_gen.append([])
                    except Exception as e2:
                        if debug_mode:
                            print(f"      [PrepareTasks] Generator {gen_id} failed even in sequential mode: {e2}")
                        all_coords_by_gen.append([])
        else:
            # single generator when directly call (also add timeout protection)
            timeout_per_generator = 10.0
            try:
                # use daemon thread to implement timeout protection, ensure timeout will not block main program
                result_container = {'result': None, 'done': False, 'exception': None}
                
                def run_generator():
                    try:
                        result_container['result'] = generate_instances_for_single_generator(
                            generator_ids[0], 
                            generator_codes[0]
                        )
                    except Exception as e:
                        result_container['exception'] = e
                    finally:
                        result_container['done'] = True
                
                thread = threading.Thread(target=run_generator, daemon=True)
                thread.start()
                thread.join(timeout=timeout_per_generator)
                
                if thread.is_alive():
                    # thread is still running, timed out
                    if debug_mode:
                        print(f"      [PrepareTasks] Single generator timeout after {timeout_per_generator}s")
                    all_coords_by_gen = [[]]
                    # daemon thread will automatically terminate when main program exits, will not block main program
                elif result_container['done']:
                    if result_container['exception']:
                        if debug_mode:
                            print(f"      [PrepareTasks] Single generator failed: {result_container['exception']}")
                        all_coords_by_gen = [[]]
                    else:
                        all_coords_by_gen = [result_container['result']]
                else:
                    # should not reach here, but return empty list for safety
                    all_coords_by_gen = [[]]
            except Exception as e:
                if debug_mode:
                    print(f"      [PrepareTasks] Single generator failed: {e}")
                all_coords_by_gen = [[]]
    
    # Step 2: parallel compute oracle for all instances (if not provided cached instances)
    # collect all instances: (generator_id, instance_index, coords)
    all_instances_with_metadata = []
    for gen_idx, gen_id in enumerate(generator_ids):
        coords_list = all_coords_by_gen[gen_idx]
        for inst_idx, coords in enumerate(coords_list):
            all_instances_with_metadata.append((gen_id, inst_idx, coords))
    
    optimal_costs_dict = {}  # {(generator_id, instance_index): optimal_cost}
    if cached_oracle_costs is not None:
        # use cached oracle costs
        optimal_costs_dict = cached_oracle_costs
        if debug_mode:
            print(f"[PrepareTasks] Using cached oracle costs: {len(optimal_costs_dict)} entries")
    elif use_gap and len(all_instances_with_metadata) > 0:
        try:
            from ...oracle import create_tsp_oracle
            
            lkh_runs_config = lkh_runs if lkh_runs is not None else 1
            # parallel degree: use optimal_parallel_n_jobs if provided, otherwise default -1
            oracle_n_jobs = optimal_parallel_n_jobs if (optimal_parallel_n_jobs is not None) else -1
            if debug_mode:
                workers = effective_n_jobs(oracle_n_jobs)
                print(f"[Oracle] instances={len(all_instances_with_metadata)}, backend=threading, n_jobs={oracle_n_jobs} -> workers={workers}, lkh_runs={lkh_runs_config}")
            
            def compute_single_oracle_cost(coords):
                try:
                    # use parameters to create oracle
                    oracle_kwargs = {
                        'oracle_timeout': oracle_timeout,
                        'runs': lkh_runs_config,
                    }
                    if lkh3_path is not None:
                        oracle_kwargs['lkh3_path'] = lkh3_path
                    if concorde_path is not None:
                        oracle_kwargs['concorde_path'] = concorde_path
                    local_oracle = create_tsp_oracle(gap_oracle, **oracle_kwargs)
                    return local_oracle.solve_exact(coords)
                except Exception as e:
                    if debug_mode:
                        print(f"      [PrepareTasks] Warning: Oracle failed: {e}")
                    return None
            
            oracle_start_time = time.time()
            try:
                optimal_costs_list = Parallel(
                    n_jobs=oracle_n_jobs,
                    backend="threading",
                    prefer="threads",
                    timeout=oracle_timeout * len(all_instances_with_metadata) * lkh_runs_config * 1.5,
                    # Don't set pre_dispatch when n_jobs=-1, let joblib use default
                    batch_size="auto",
                    verbose=10 if debug_mode else 0,
                )(
                    delayed(compute_single_oracle_cost)(coords) 
                    for gen_id, inst_idx, coords in all_instances_with_metadata
                )
                for (gen_id, inst_idx, _), optimal_cost in zip(all_instances_with_metadata, optimal_costs_list):
                    optimal_costs_dict[(gen_id, inst_idx)] = optimal_cost
            except Exception as e:
                if debug_mode:
                    print(f"      [PrepareTasks] Warning: Parallel oracle failed: {e}")
            finally:
                oracle_time = time.time() - oracle_start_time
                try:
                    from ...utils.evaluation_timer import get_timer
                    timer = get_timer()
                    timer.add_oracle_time(oracle_time)
                except Exception:
                    pass  # Silently fail if timer not available
        except Exception as e:
            if debug_mode:
                print(f"      [PrepareTasks] Warning: Oracle initialization failed: {e}")
    
    # Step 3: pre-compile all solver modules (add timeout protection)
    solver_modules = []
    timeout_per_solver = 5.0  # each solver compile最多5秒

    for solver_id, solver_code in zip(solver_ids, solver_codes):
        try:
            with warnings.catch_warnings():
                warnings.simplefilter("ignore")
                # use ThreadPoolExecutor to add timeout protection
                with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                    def compile_solver():
                        heuristic_module = types.ModuleType(f"heuristic_module_{solver_id}")
                        exec(solver_code, heuristic_module.__dict__)
                        return heuristic_module
                    
                    try:
                        future = executor.submit(compile_solver)
                        heuristic_module = future.result(timeout=timeout_per_solver)
                        solver_modules.append(heuristic_module)
                    except concurrent.futures.TimeoutError:
                        if debug_mode:
                            print(f"      [PrepareTasks] Solver {solver_id} compilation timeout after {timeout_per_solver}s")
                        solver_modules.append(None)
                        future.cancel()
        except Exception as e:
            if debug_mode:
                print(f"      [PrepareTasks] Error compiling solver {solver_id}: {e}")
            solver_modules.append(None)
    
    # Step 4: generate all tasks
    # format: (solver_id, generator_id, coords, optimal_cost, weight, time_limit, ite_max, perturbation_moves, heuristic_module)
    all_tasks = []
    for solver_idx, solver_id in enumerate(solver_ids):
        if solver_modules[solver_idx] is None:
            continue
        
        heuristic_module = solver_modules[solver_idx]
        
        for gen_idx, gen_id in enumerate(generator_ids):
            coords_list = all_coords_by_gen[gen_idx]
            weight = generator_weights[gen_idx] if gen_idx < len(generator_weights) else 0.0
            
            for inst_idx, coords in enumerate(coords_list):
                optimal_cost = optimal_costs_dict.get((gen_id, inst_idx), None)
                all_tasks.append((
                    solver_id, gen_id, coords, optimal_cost, weight,
                    time_limit, ite_max, perturbation_moves,
                    heuristic_module
                ))
    
    if debug_mode:
        print(f"[PrepareTasks] Generated {len(all_tasks)} tasks: {len(solver_ids)} solvers × {len(generator_ids)} generators × {n_instances} instances")
    
    return all_tasks, all_coords_by_gen, optimal_costs_dict

