from __future__ import annotations

from typing import List, Callable, Dict, Tuple, Optional, Any
import numpy as np
import types
import warnings
from collections import defaultdict
from joblib import Parallel, delayed
from joblib.parallel import effective_n_jobs
from joblib.externals.loky.process_executor import TerminatedWorkerError
import concurrent.futures
import time
import threading

from ...evaluation import online_binpack
from ...oracle import create_bp_online_oracle

# Try to import scipy.special.erf for numpy.erf compatibility
try:
    from scipy.special import erf as scipy_erf
    HAS_SCIPY_ERF = True
except ImportError:
    HAS_SCIPY_ERF = False
    # Fallback: use math.erf if available (Python 3.7+)
    try:
        from math import erf as math_erf
        scipy_erf = math_erf
    except ImportError:
        scipy_erf = None


def prepare_exec_namespace() -> Dict[str, Any]:
    """
    Prepare a namespace for exec() that includes numpy.erf compatibility.
    
    Returns:
        Dictionary with numpy and other standard imports, including numpy.erf
    """
    namespace = {
        '__builtins__': __builtins__,
        'numpy': np,
        'np': np,
    }
    
    # Add numpy.erf compatibility
    # Since numpy doesn't have erf in newer versions, we add it directly to the namespace
    # This avoids pickling issues with wrapper classes
    if HAS_SCIPY_ERF and scipy_erf is not None:
        # Add erf as a standalone function in the namespace
        namespace['erf'] = scipy_erf
        # Also try to add it to numpy module (may not work if numpy is read-only)
        try:
            # Create a copy of numpy module attributes and add erf
            # This is safer than modifying the original numpy module
            import types
            numpy_module = types.ModuleType('numpy')
            # Copy all numpy attributes
            for attr_name in dir(np):
                if not attr_name.startswith('_'):
                    try:
                        setattr(numpy_module, attr_name, getattr(np, attr_name))
                    except (TypeError, AttributeError):
                        pass
            numpy_module.erf = scipy_erf
            namespace['numpy'] = numpy_module
            namespace['np'] = numpy_module
        except Exception:
            # If that fails, just add erf to namespace and let code use it directly
            # Code can use: erf(x) instead of numpy.erf(x)
            pass
    
    return namespace


def evaluate_single_solver_instance(
    solver_id: int,
    generator_id: int,
    instance: Dict,
    optimal_lb: Optional[float],
    weight: float,  # Weight is included in task but not used in evaluation
    time_limit: int,
    heuristic_module,
    oracle_type: Optional[str] = None,  # Oracle type for debugging
    oracle_status: Optional[str] = None  # Oracle status (OPTIMAL, FEASIBLE, etc.)
) -> Tuple[int, int, float]:
    """
    Evaluate a single (solver, generator_instance) combination.
    
    This is a unified evaluation function used for both solver and generator.
    
    Args:
        solver_id: Solver ID
        generator_id: Generator ID
        instance: BP Online instance dict with 'items', 'capacity', 'num_items'
        optimal_lb: Optimal lower bound (for gap calculation)
        time_limit: Time limit (not used for BP Online, but kept for consistency)
        heuristic_module: Compiled heuristic module
        oracle_type: Oracle type ("cp-sat", "lb", etc.) for debugging purposes
        oracle_status: Oracle status ("OPTIMAL", "FEASIBLE", "LB", etc.) for debugging
        
    Returns:
        (solver_id, generator_id, gap)
    """
    try:
        # Compile code from module (extract code string if needed)
        # For now, we assume heuristic_module is already compiled
        # We need to evaluate using the module's score function
        
        # Get instance data
        capacity = instance['capacity']
        items = np.array(instance['items'], dtype=float)  # Ensure float type
        num_items = instance['num_items']
        
        # Create bins
        # Use float type to avoid type casting errors in score functions
        bins = np.array([float(capacity) for _ in range(num_items)], dtype=float)
        
        # Pack items using online_binpack
        packing, bins_packed = online_binpack(items, bins, heuristic_module)
        
        # Count used bins - use packing length which is more reliable
        # packing already filters out unused bins, so len(packing) is the actual number of bins used
        num_bins = len(packing)
        # Compute gap
        if optimal_lb is not None and optimal_lb > 0:
            gap = (num_bins / optimal_lb - 1.0) * 100.0
            
            if oracle_status and oracle_status != "OPTIMAL":
                oracle_info = f"oracle={oracle_type}" if oracle_type else "oracle=unknown"
                print(f"      [WARNING] Not using optimal solution: solver_id={solver_id}, gen_id={generator_id}, "
                      f"status={oracle_status}, optimal_lb={optimal_lb:.5f}, "
                      f"{oracle_info}, capacity={capacity}, num_items={num_items}", flush=True)
        else:
            gap = float('inf')
        return solver_id, generator_id, float(gap)
    except Exception as e:
        if hasattr(e, '__traceback__'):
            import traceback
            traceback.print_exc()
        return solver_id, generator_id, 1e9


def batch_evaluate_tasks(
    tasks: List[Tuple],
    evaluate_fn: Callable,
    n_jobs: int = -1,
    backend: str = "threading",
    prefer: str = "threads",
    timeout: Optional[float] = None,
    debug_mode: bool = False,
    track_time: bool = False,
    time_key: str = "solver",  # "solver" or "generator"
    task_batch_size: Optional[int] = None,
) -> Dict[Tuple[int, int], float]:
    """
    Unified batch evaluation function: parallel evaluate all tasks, average over instances for each (solver_id, generator_id) and return.
    
    Args:
        tasks: List of tasks to evaluate, each task is unpacked and passed to evaluate_fn
        evaluate_fn: Function to evaluate a single task
            Signature: fn(*task_args) -> (solver_id, generator_id, gap)
        n_jobs, backend, prefer, timeout: Parallel execution parameters
        task_batch_size: Max number of tasks per internal Parallel call (None = use default)
        debug_mode: Whether to print debug information
        
    Returns:
        Dictionary mapping (solver_id, generator_id) -> mean_gap (averaged over instances)
    """
    if len(tasks) == 0:
        return {}
    
    parallel_kwargs = {
        'n_jobs': n_jobs,
        'backend': backend,
        'prefer': prefer,
        'batch_size': "auto",
    }
    # Only set pre_dispatch if n_jobs > 0, otherwise let joblib use default
    if n_jobs > 0:
        parallel_kwargs['pre_dispatch'] = "2*n_jobs"
    if timeout is not None:
        parallel_kwargs['timeout'] = timeout
    
    if debug_mode:
        workers = effective_n_jobs(n_jobs)
        parallel_kwargs['verbose'] = 10
    
    # Track evaluation time if requested
    eval_start_time = time.time()
    
    # batch execute, avoid submitting large tasks at once, and add timeout protection
    # default batch_size: if not specified, use min(96, n_jobs*2, len(tasks)), avoid creating too many processes at once
    if task_batch_size is None or task_batch_size <= 0:
        # smart default value: set reasonable batch_size based on worker count
        if n_jobs > 0:
            default_batch_size = min(96, max(effective_n_jobs(n_jobs) * 2, 16), len(tasks))
        else:
            default_batch_size = min(96, len(tasks))
        effective_batch_size = default_batch_size
    else:
        effective_batch_size = task_batch_size
    
    effective_batch_size = min(effective_batch_size, len(tasks))
    effective_batch_size = max(1, effective_batch_size)
    n_batches = (len(tasks) + effective_batch_size - 1) // effective_batch_size
    
    if debug_mode:
        if n_batches > 1:
            print(f"      [BatchEval] Will process {len(tasks)} tasks in {n_batches} batches (batch_size={effective_batch_size})", flush=True)
        else:
            print(f"      [BatchEval] Processing {len(tasks)} tasks in a single batch", flush=True)
        if n_jobs > 0:
            actual_workers = effective_n_jobs(n_jobs)
            print(f"[BatchEval] Using {actual_workers} parallel workers (requested n_jobs={n_jobs})", flush=True)
            print(f"[BatchEval] Each batch will process up to {effective_batch_size} tasks with {actual_workers} workers", flush=True)
    
    batch_timeout = None
    if timeout is not None:
        batch_timeout = timeout / n_batches * 1.2  # add 20% buffer time for each batch
    else:
        batch_timeout = len(tasks) * 60.0 / max(1, effective_n_jobs(n_jobs)) / n_batches * 1.5
        batch_timeout = max(batch_timeout, 300.0)  # at least 5 minutes
    
    all_results = []
    try:
        for batch_idx in range(n_batches):
            start = batch_idx * effective_batch_size
            end = min(start + effective_batch_size, len(tasks))
            batch_tasks = tasks[start:end]
            
            batch_start_time = time.time()
            
            if debug_mode:
                print(f"      [BatchEval] Processing batch {batch_idx + 1}/{n_batches} (tasks {start+1}-{end}/{len(tasks)}, timeout={batch_timeout:.1f}s)...", flush=True)
            
            batch_results = []
            batch_timeout_flag = threading.Event()
            
            def batch_timeout_monitor():
                elapsed = time.time() - batch_start_time
                while elapsed < batch_timeout and not batch_timeout_flag.is_set():
                    time.sleep(1.0)
                    elapsed = time.time() - batch_start_time
                if elapsed >= batch_timeout and not batch_timeout_flag.is_set():
                    batch_timeout_flag.set()
                    if debug_mode:
                        print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} timeout detected after {elapsed:.1f}s", flush=True)
            
            monitor_thread = None
            if batch_timeout is not None and batch_timeout > 0:
                monitor_thread = threading.Thread(target=batch_timeout_monitor, daemon=True)
                monitor_thread.start()
            
            try:
                batch_parallel_kwargs = parallel_kwargs.copy()
                batch_parallel_kwargs['timeout'] = batch_timeout
                
                def run_parallel():
                    with Parallel(**batch_parallel_kwargs) as parallel_executor:
                        return parallel_executor(
                            delayed(evaluate_fn)(*task) for task in batch_tasks
                        )
                
                with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                    future = executor.submit(run_parallel)
                    try:
                        batch_results = future.result(timeout=batch_timeout)
                        batch_timeout_flag.set() 
                    except concurrent.futures.TimeoutError:
                        batch_timeout_flag.set()
                        future.cancel()
                        try:
                            concurrent.futures.wait([future], timeout=2.0)
                        except Exception:
                            pass
                        raise TimeoutError(f"Batch {batch_idx + 1} exceeded timeout {batch_timeout:.1f}s")
                
                batch_time = time.time() - batch_start_time
                if debug_mode:
                    print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} completed in {batch_time:.1f}s ({len(batch_results)} results)", flush=True)
                    
            except (TimeoutError, concurrent.futures.TimeoutError, TerminatedWorkerError) as e:
                batch_timeout_flag.set()
                batch_time = time.time() - batch_start_time
                if debug_mode:
                    print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} timeout after {batch_time:.1f}s: {type(e).__name__}", flush=True)
                    print(f"      [BatchEval] Skipping remaining tasks in this batch and continuing...", flush=True)
                batch_results = []
                for task in batch_tasks:
                    try:
                        solver_id = task[0]
                        generator_id = task[1]
                        batch_results.append((solver_id, generator_id, 1e9))
                    except (IndexError, TypeError):
                        batch_results.append((0, 0, 1e9))
                        
            except Exception as e:
                batch_timeout_flag.set()
                batch_time = time.time() - batch_start_time
                if debug_mode:
                    print(f"      [BatchEval] Batch {batch_idx + 1}/{n_batches} failed after {batch_time:.1f}s: {type(e).__name__}: {e}", flush=True)
                    if batch_time < batch_timeout:
                        print(f"      [BatchEval] Attempting sequential fallback for batch {batch_idx + 1}/{n_batches}...", flush=True)
                        try:
                            batch_results = [evaluate_fn(*task) for task in batch_tasks]
                            if debug_mode:
                                print(f"      [BatchEval] Sequential fallback succeeded for batch {batch_idx + 1}/{n_batches}", flush=True)
                        except Exception as e2:
                            if debug_mode:
                                print(f"      [BatchEval] Sequential fallback also failed: {e2}", flush=True)
                            batch_results = []
                            for task in batch_tasks:
                                try:
                                    solver_id = task[0]
                                    generator_id = task[1]
                                    batch_results.append((solver_id, generator_id, 1e9))
                                except (IndexError, TypeError):
                                    batch_results.append((0, 0, 1e9))
                    else:
                        batch_results = []
                        for task in batch_tasks:
                            try:
                                solver_id = task[0]
                                generator_id = task[1]
                                batch_results.append((solver_id, generator_id, 1e9))
                            except (IndexError, TypeError):
                                batch_results.append((0, 0, 1e9))
                else:
                    batch_time = time.time() - batch_start_time
                    if batch_time < batch_timeout:
                        try:
                            batch_results = [evaluate_fn(*task) for task in batch_tasks]
                        except Exception:
                            batch_results = []
                            for task in batch_tasks:
                                try:
                                    solver_id = task[0]
                                    generator_id = task[1]
                                    batch_results.append((solver_id, generator_id, 1e9))
                                except (IndexError, TypeError):
                                    batch_results.append((0, 0, 1e9))
                    else:
                        batch_results = []
                        for task in batch_tasks:
                            try:
                                solver_id = task[0]
                                generator_id = task[1]
                                batch_results.append((solver_id, generator_id, 1e9))
                            except (IndexError, TypeError):
                                batch_results.append((0, 0, 1e9))
            
            finally:
                batch_timeout_flag.set()
            
            all_results.extend(batch_results)
    
    except Exception as e:
        if debug_mode:
            print(f"      [BatchEval] Batch processing failed: {type(e).__name__}: {e}", flush=True)
            print(f"      [BatchEval] Falling back to sequential execution...", flush=True)
        try:
            all_results = [evaluate_fn(*task) for task in tasks]
        except Exception as e2:
            if debug_mode:
                print(f"      [BatchEval] Sequential fallback also failed: {e2}", flush=True)
            all_results = []
            for task in tasks:
                try:
                    solver_id = task[0]
                    generator_id = task[1]
                    all_results.append((solver_id, generator_id, 1e9))
                except (IndexError, TypeError):
                    all_results.append((0, 0, 1e9))
    
    results = all_results
    
    eval_time = time.time() - eval_start_time
    
    if track_time:
        try:
            from ....utils.evaluation_timer import get_timer
            timer = get_timer()
            if time_key == "solver":
                timer.add_solver_evaluation_time(eval_time)
            elif time_key == "generator":
                timer.add_generator_evaluation_time(eval_time)
        except Exception:
            pass  # Silently fail if timer not available
    
    # Aggregate results by (solver_id, generator_id)
    results_dict = defaultdict(list)
    for solver_id, generator_id, gap in results:
        if np.isfinite(gap) and gap < 1e8:  # Filter out invalid results
            results_dict[(solver_id, generator_id)].append(gap)
    
    # Compute mean gap for each (solver_id, generator_id) pair
    mean_results = {}
    for (solver_id, generator_id), gaps in results_dict.items():
        mean_gap = float(np.mean(gaps))
        mean_results[(solver_id, generator_id)] = mean_gap
    
    
    return mean_results


def prepare_tasks(
    solver_codes: List[str],
    solver_ids: List[int],
    generator_codes: List[str],
    generator_ids: List[int],
    generator_weights: np.ndarray,
    n_instances: int,
    capacity: int,
    num_items: int,
    time_limit: int,
    use_gap: bool,
    gap_oracle: str,
    oracle_timeout: int,
    optimal_parallel_n_jobs: Optional[int] = None,
    debug_mode: bool = False,
    cached_instances: Optional[List[List[Dict]]] = None,
    cached_oracle_costs: Optional[Dict[Tuple[int, int], float]] = None,
    config: Optional[Any] = None
) -> Tuple[List[Tuple], List[List[Dict]], Dict[Tuple[int, int], float]]:
    """
    Unified prepare_tasks function: prepare evaluation tasks for all (solver, generator) combinations.
    
    Args:
        solver_codes: List of solver code strings
        solver_ids: List of solver IDs
        generator_codes: List of generator code strings
        generator_ids: List of generator IDs
        generator_weights: Array of weights for each generator
        n_instances: Number of instances to generate per generator
        capacity: Bin capacity
        num_items: Number of items per instance
        time_limit: Time limit (not used for BP Online, but kept for consistency)
        use_gap: Whether to compute gap (requires oracle)
        gap_oracle: Oracle type ("lb" or "none")
        oracle_timeout: Timeout for oracle (seconds)
        optimal_parallel_n_jobs: Parallel jobs for oracle computation
        debug_mode: Whether to print debug information
        
    Returns:
        Tuple of:
        - all_tasks: List of tasks
        - all_instances_by_gen: List[List[Dict]] - instances per generator (for caching)
        - optimal_costs_dict: Dict[(gen_id, inst_idx): optimal_lb] - oracle costs (for caching)
    """
    # Validate inputs
    if n_instances is None or n_instances <= 0:
        raise ValueError(f"prepare_tasks: n_instances must be a positive integer, got {n_instances}")
    if capacity is None or capacity <= 0:
        raise ValueError(f"prepare_tasks: capacity must be a positive integer, got {capacity}")
    if num_items is None or num_items <= 0:
        raise ValueError(f"prepare_tasks: num_items must be a positive integer, got {num_items}")
    
    n_instances = int(n_instances)
    time_limit = int(time_limit)
    capacity = int(capacity)
    num_items = int(num_items)
    
    # Step 1: Generate instances from all generators
    if cached_instances is not None:
        all_instances_by_gen = cached_instances
    else:
        def generate_instances_for_single_generator(gen_id, gen_code):
            """Generate instances for a single generator (simplified, timeout handled by joblib.Parallel)"""
            try:
                with warnings.catch_warnings():
                    warnings.simplefilter("ignore")
                    gen_mod = types.ModuleType(f"generator_module_{gen_id}")
                    exec_namespace = prepare_exec_namespace()
                    exec_namespace.update(gen_mod.__dict__)
                    exec(gen_code, exec_namespace)
                    gen_mod.__dict__.update(exec_namespace)
                    
                    if not hasattr(gen_mod, "generate_instances"):
                        return []
                    
                    seeds = np.arange(n_instances, dtype=int)
                    # Generator now returns List[np.ndarray], each is items array
                    items_arrays = gen_mod.generate_instances(seeds, capacity, num_items)
                    
                    # External wrapper assembles dict format
                    valid_instances = []
                    for items in items_arrays:
                        # Validate items array
                        items = np.asarray(items, dtype=int)
                        if len(items) != num_items:
                            continue
                        if items.min() < 1 or items.max() >= capacity:
                            continue
                        
                        # Assemble into standard dict format
                        inst = {
                            'items': items,
                            'capacity': capacity,
                            'num_items': num_items
                        }
                        valid_instances.append(inst)
                    return valid_instances
            except Exception:
                return []
        
        # Generate instances in batches to avoid timeout
        batch_size = 20  # Process 20 generators per batch
        n_generators = len(generator_codes)
        
        def _generate_with_id(args):
            """Wrapper for parallel execution"""
            idx, gen_id, gen_code = args
            try:
                instances = generate_instances_for_single_generator(gen_id, gen_code)
                return idx, instances
            except Exception:
                return idx, []
        
        all_instances_by_gen = [None] * n_generators  # Pre-allocate list
        
        if n_generators > 1:
            # Process in batches
            n_workers = min(batch_size, 16)  # Limit workers per batch
            n_batches = (n_generators + batch_size - 1) // batch_size
            
            for batch_idx in range(n_batches):
                start_idx = batch_idx * batch_size
                end_idx = min(start_idx + batch_size, n_generators)
                batch_generator_ids = generator_ids[start_idx:end_idx]
                batch_generator_codes = generator_codes[start_idx:end_idx]
                
                try:
                    results = Parallel(
                        n_jobs=n_workers,
                        backend="threading",
                        prefer="threads",
                        verbose=0,
                        timeout=10.0  # 10 seconds per batch
                    )(
                        delayed(_generate_with_id)((start_idx + i, gen_id, gen_code))
                        for i, (gen_id, gen_code) in enumerate(zip(batch_generator_ids, batch_generator_codes))
                    )
                    # Store results in correct positions
                    for idx, instances in results:
                        all_instances_by_gen[idx] = instances
                except Exception:
                    # Fill batch with empty results
                    for i in range(start_idx, end_idx):
                        all_instances_by_gen[i] = []
        else:
            # Single generator
            gen_id, gen_code = generator_ids[0], generator_codes[0]
            instances = generate_instances_for_single_generator(gen_id, gen_code)
            all_instances_by_gen = [instances]
        
    # Step 2: Compute oracle (lb) for all instances
    all_instances_with_metadata = []
    for gen_idx, gen_id in enumerate(generator_ids):
        inst_list = all_instances_by_gen[gen_idx]
        for inst_idx, instance in enumerate(inst_list):
            all_instances_with_metadata.append((gen_id, inst_idx, instance))
    
    optimal_costs_dict = {}
    if cached_oracle_costs is not None:
        optimal_costs_dict = cached_oracle_costs
    elif use_gap and len(all_instances_with_metadata) > 0:
        try:
            oracle_n_jobs = optimal_parallel_n_jobs if (optimal_parallel_n_jobs is not None) else -1
            
            def compute_single_oracle_cost(instance):
                try:
                    if config is not None:
                        oracle = create_bp_online_oracle(
                            config=config,
                            oracle_type=gap_oracle,  # 可以覆盖 config 中的 oracle_type
                        )
                    else:
                        oracle = create_bp_online_oracle(oracle_type=gap_oracle)
                    result = oracle.solve_exact(instance)
                    if isinstance(result, tuple):
                        return result
                    else:
                        return (result, "UNKNOWN")
                except Exception:
                    return None
            oracle_start_time = time.time()
            try:
                optimal_costs_list = Parallel(
                    n_jobs=oracle_n_jobs,
                    backend="threading",
                    prefer="threads",
                    batch_size="auto",
                    verbose=10 if debug_mode else 0,
                )(
                    delayed(compute_single_oracle_cost)(instance)
                    for gen_id, inst_idx, instance in all_instances_with_metadata
                )
                for (gen_id, inst_idx, _), optimal_cost in zip(all_instances_with_metadata, optimal_costs_list):
                    optimal_costs_dict[(gen_id, inst_idx)] = optimal_cost
            except Exception:
                pass
            finally:
                oracle_time = time.time() - oracle_start_time
                try:
                    from ....utils.evaluation_timer import get_timer
                    timer = get_timer()
                    timer.add_oracle_time(oracle_time)
                except Exception:
                    pass
        except Exception:
            pass

    # Step 3: Pre-compile all solver modules
    solver_modules = []
    
    def compile_solver(solver_id, solver_code):
        """Compile a single solver with timeout protection"""
        def _compile():
            try:
                with warnings.catch_warnings():
                    warnings.simplefilter("ignore")
                    heuristic_module = types.ModuleType(f"heuristic_module_{solver_id}")
                    exec_namespace = prepare_exec_namespace()
                    exec_namespace.update(heuristic_module.__dict__)
                    exec(solver_code, exec_namespace)
                    heuristic_module.__dict__.update(exec_namespace)
                    
                    # Verify that the module has a score function
                    if not hasattr(heuristic_module, 'score') or not callable(getattr(heuristic_module, 'score', None)):
                        return None
                    
                    return heuristic_module
            except Exception:
                return None
        
        try:
            with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                future = executor.submit(_compile)
                return future.result(timeout=10.0)  # 10秒超时
        except (concurrent.futures.TimeoutError, Exception):
            return None
    
    for solver_id, solver_code in zip(solver_ids, solver_codes):
        solver_modules.append(compile_solver(solver_id, solver_code))
    
    # Step 4: Generate all tasks
    # Format: (solver_id, generator_id, instance, optimal_lb, weight, time_limit, heuristic_module, oracle_type, oracle_status)
    all_tasks = []
    for solver_idx, solver_id in enumerate(solver_ids):
        if solver_modules[solver_idx] is None:
            continue
        
        heuristic_module = solver_modules[solver_idx]
        
        for gen_idx, gen_id in enumerate(generator_ids):
            inst_list = all_instances_by_gen[gen_idx]
            weight = generator_weights[gen_idx] if gen_idx < len(generator_weights) else 0.0
            
            for inst_idx, instance in enumerate(inst_list):
                optimal_result = optimal_costs_dict.get((gen_id, inst_idx), None)
                if optimal_result is None:
                    optimal_lb = None
                    oracle_status = None
                elif isinstance(optimal_result, tuple):
                    optimal_lb, oracle_status = optimal_result
                else:
                    optimal_lb = optimal_result
                    oracle_status = "UNKNOWN"
                all_tasks.append((
                    solver_id, gen_id, instance, optimal_lb, weight,
                    time_limit, heuristic_module, gap_oracle, oracle_status
                ))
    
    return all_tasks, all_instances_by_gen, optimal_costs_dict

