from __future__ import annotations

import json
import os
from dataclasses import asdict
from typing import Dict, List, Optional, Tuple
from datetime import datetime
import time
import numpy as np
from joblib import Parallel, delayed

from .config import HeuPSROConfig
from .resume import recover_missing_strategies, load_utilities_with_fallback, resume_from_checkpoint
from .metagame import MetaGame
from .pools import StrategyPools
from .context_builder import build_solver_context, build_generator_context
from .base.problem_adapter import ProblemAdapter
from ..utils.reporting_utils import print_iteration_summary, save_diversity_report


class HeuPSROController:
    """Controller that eoh_management_strategys init/resume, incremental U, NE, and BR training.

    - Does NOT modify upstream eoh; uses problem adapter for evolution.
    - Maintains incremental utility matrix; only evaluates new rows/cols.
    - Supports minimum simple/baseline generator sampling ratio throughout.
    - Problem-agnostic: delegates problem-specific logic to ProblemAdapter.
    """

    def __init__(self, cfg: HeuPSROConfig, out_dir: str, problem_adapter: ProblemAdapter = None) -> None:
        self.cfg = cfg
        self.out_dir = out_dir
        os.makedirs(self.out_dir, exist_ok=True)
        
        # Initialize experiment file manager (delayed import to avoid circular import)
        from ..experiments.manager import ExperimentFileManager
        self.file_manager = ExperimentFileManager(self.out_dir)
        
        self.debug_mode = getattr(cfg, 'debug_mode', False)
        self.meta = MetaGame()
        self.pools = StrategyPools(meta=self.meta) 
        self.seed = cfg.seed
        self.iteration = 0
        np.random.seed(self.seed)
        
        self._utility_cache = {}

        # Track EOH generation numbers for continuation
        self._solver_eoh_generation = 0
        self._generator_eoh_generation = 0

        self.solver_eoh_dir = self.file_manager.paths.solver_eoh_dir
        self.generator_eoh_dir = self.file_manager.paths.generator_eoh_dir
        
        # Set up problem adapter (for backward compatibility, auto-detect TSP if not provided)
        if problem_adapter is None:
            # Auto-detect TSP problem (backward compatibility)
            if hasattr(cfg, 'n_cities') and cfg.n_cities is not None:
                from ..problems.tsp_gls.adapter import TSPProblemAdapter
                self.problem_adapter = TSPProblemAdapter(cfg)
            else:
                raise ValueError("No problem_adapter provided and cannot auto-detect problem type")
        else:
            self.problem_adapter = problem_adapter
        
        # Create EoH bridge via problem adapter
        self.eoh = self.problem_adapter.create_eoh_bridge(
            cfg, self.solver_eoh_dir, self.generator_eoh_dir
        )
        
        # Initialize utilities
        from ..utils.save_utils import ExperimentSaver
        from ..utils import StrategyVisualizer
        self.saver = ExperimentSaver(out_dir, self.file_manager)
        self.visualizer = StrategyVisualizer(out_dir, self.debug_mode)
        
        # Save initial experiment metadata
        self.saver.save_experiment_metadata(cfg)
        
        # Initialize PSRO diversity components if enabled (may wrap pools)
        self._init_diversity_components()
        
        # Create problem-specific sampler via adapter
        sampler = self.problem_adapter.create_sampler(self.pools, cfg)
        if sampler is None:
            raise ValueError("Problem adapter must provide a sampler")
        self.problem_sampler = sampler
        # Keep self.sampler for backward compatibility (may be used in some places)
        self.sampler = sampler
    
    def _init_diversity_components(self) -> None:
        if not self.cfg.psro_diversity_enabled:
            self.pool_manager = None
            return
        
        from .diversity.pool_manager import PoolDiversityManager
        from .diversity.diverse_pools import DiversityAwarePools
        
        # Create pool manager
        self.pool_manager = PoolDiversityManager(self.cfg, self.pools, self.meta)
        self.pools = DiversityAwarePools(self.pools, self.pool_manager, self.meta)

    # ---------- Public API ----------
    def initialize(self) -> None:
        """Fresh initialization: delegate to problem adapter."""
        self.problem_adapter.initialize(self)
        
        # Find h0 and g0 indices after initialization
        h0_idx = None
        g0_idx = None
        for i, s in enumerate(self.pools.solver_pool):
            if s.program_id == "h0":
                h0_idx = i
                break
        for i, g in enumerate(self.pools.generator_pool):
            if g.program_id == "g0":
                g0_idx = i
                break
        
        if h0_idx is not None:
            # Initialize initial utility matrix directly
            self._compute_initial_utility_matrix()

    def _compute_initial_utility_matrix(self) -> None:
        """Compute initial utility matrix: h0 on g0 instances."""
        solver_code = self.pools.get_solver(0).code
        instances = self.problem_sampler.sample_from_single_generator(0, n=self.cfg.eval_n_instances)
        
        # Debug: check instances
        if len(instances) == 0:
            print(f"    WARNING: No instances generated for g0")
        else:
            print(f"    Debug: Generated {len(instances)} instances for g0")
        
        gap_pct = self.problem_adapter.evaluate_solver(solver_code, instances, utility_cache=self._utility_cache)
        self.meta.set_utility(0, 0, gap_pct)
        print(f"    h0 vs g0: gap = {gap_pct:.4f}")
        if np.isinf(gap_pct) or np.isnan(gap_pct):
            print(f"    WARNING: gap is {gap_pct}, this may indicate invalid instances or oracle failure")
        self._utility_cache[(0, 0)] = gap_pct

    def solve_meta_game(self) -> Tuple[np.ndarray, np.ndarray]:
        """Solve meta-game using the configured solver (NE or Alpha-Rank).
        
        Returns:
            sigma_h: Solver mixture weights
            sigma_g: Generator mixture weights
        """
        meta_solver = getattr(self.cfg, 'meta_game_solver', 'ne')
        
        if meta_solver == "alpha_rank":
            alpha = getattr(self.cfg, 'alpha_rank_alpha', 15.0)
            num_iters = getattr(self.cfg, 'alpha_rank_num_iters', 10_000)
            tol = getattr(self.cfg, 'alpha_rank_tol', 1e-10)
            debug_alpha_rank = getattr(self.cfg, 'debug_alpha_rank', False) or self.debug_mode
            sigma_h, sigma_g = self.meta.solve_alpha_rank(
                alpha=alpha,
                num_iters=num_iters,
                tol=tol,
                debug=debug_alpha_rank
            )
        else:  # default to "ne"
            sigma_h, sigma_g = self.meta.solve_ne()
        
        return sigma_h, sigma_g

    def resume(self, state_dir: str, resume_from_round: int = None) -> None:
        """Resume from previous state directory (delegates to resume_from_checkpoint)."""
        resume_state = resume_from_checkpoint(self, state_dir, resume_from_round)
        
        # Set controller state from resume results
        self.iteration = resume_state["iteration"]
        eoh_state = resume_state["eoh_state"]
        self._solver_eoh_generation = eoh_state.get("solver_eoh_generation", 0)
        self._generator_eoh_generation = eoh_state.get("generator_eoh_generation", 0)

    def save(self) -> None:
        """Save current state using the saver utility."""
        self.saver.save_pools_and_utilities(self.pools, self.meta, self.cfg)
        self.saver.save_utility_matrix(self.meta)
        self.saver.save_statistics_table(self.meta, self.pools, self)
        self.saver.save_evolution_tracking(self, self.iteration)
        self.saver.save_performance_metrics(self, self.iteration)
        self.saver.save_checkpoint(self, self.iteration)
        self.saver.save_timing_statistics(self, self.iteration)
        self.saver.save_nash_mixture(self, self.iteration)  # Save sigma and solver mixture
        
        # Save diversity statistics if enabled
        if self.cfg.psro_diversity_enabled and self.pool_manager:
            save_diversity_report(
                self.out_dir, self.iteration, self.pools, self.pool_manager, self.cfg
            )
    

    def iterate_one_round(self) -> None:
        """One PSRO iteration: incremental U → NE → BR(h|σ_G) & BR(g|σ_S) via EoH → expand.

        - First, compute NE on current U.
        - Then, fix generator mix σ_G to evolve solver BR on instances sampled accordingly.
        - Next, fix solver mix σ_S to evolve generator BR that worsens σ_S.
        """
        self.iteration += 1
        print(f" PSRO Iteration {self.iteration}")
        
        # Initialize timing variables
        round_start_time = time.time()
        nash_start = None
        solver_evolution_start = None
        generator_evolution_start = None
        utility_update_start = None
        
        # Single check at the beginning: ensure utilities matrix dimensions match pools
        n_h_meta = self.meta.utilities.shape[0]
        n_g_meta = self.meta.utilities.shape[1]
        n_h_pools = self.pools.n_solvers
        n_g_pools = self.pools.n_generators
        if n_h_meta != n_h_pools or n_g_meta != n_g_pools:
            raise ValueError(
                f"Utilities matrix shape mismatch: meta={self.meta.utilities.shape}, pools=(solvers={n_h_pools}, generators={n_g_pools}). "
                f"This indicates an incorrect resume - please check resume_from_round and ensure files were cleaned properly."
            )
        
        # Step 2: Solve Meta-Game (Nash Equilibrium or Alpha-Rank)
        nash_start = time.time()
        meta_solver = getattr(self.cfg, 'meta_game_solver', 'ne')
        print(f"   Using meta-game solver: {meta_solver} (from config: {getattr(self.cfg, 'meta_game_solver', 'not set')})")
        
        sigma_h, sigma_g_full = self.solve_meta_game()
        
        if meta_solver == "alpha_rank":
            print(f"   Alpha-Rank: σ_H={len(sigma_h)} solvers, σ_G_total={len(sigma_g_full)} generators (incl. simple)")
            debug_alpha_rank = getattr(self.cfg, 'debug_alpha_rank', False) or self.debug_mode
            if debug_alpha_rank:
                alpha = getattr(self.cfg, 'alpha_rank_alpha', 15.0)
                num_iters = getattr(self.cfg, 'alpha_rank_num_iters', 10_000)
                tol = getattr(self.cfg, 'alpha_rank_tol', 1e-10)
                print(f"     Utilities matrix used for calculation:")
                print(f"    {self.meta.utilities}")
                print(f"     Generator pairwise comparison matrix (P_g):")
                P_g = self.meta._generator_pairwise_matrix()
                print(f"    {P_g}")
                print(f"     Alpha-Rank parameters: alpha={alpha}, num_iters={num_iters}, tol={tol}")
        else:
            print(f"   NE: σ_H={len(sigma_h)} solvers, σ_G_total={len(sigma_g_full)} generators (incl. simple)")
        nash_time = time.time() - nash_start
        self._nash_equilibrium_time = nash_time
        
        heuristics = [s.code for s in self.pools.solver_pool]
        
        if getattr(self.cfg, 'psro_use_latest_only', False):
            if self.pools.n_generators > 0:
                latest_g_idx = self.pools.n_generators - 1
                sigma_g_full = np.zeros(self.pools.n_generators)
                sigma_g_full[latest_g_idx] = 1.0
                if self.debug_mode:
                    print(f"   Using latest generator only (index {latest_g_idx}) for solver BR")
            
            # Generator BR
            if self.pools.n_solvers > 0:
                latest_h_idx = self.pools.n_solvers - 1
                sigma_h = np.zeros(self.pools.n_solvers)
                sigma_h[latest_h_idx] = 1.0
                if self.debug_mode:
                    print(f"   Using latest solver only (index {latest_h_idx}) for generator BR")

        # Step 3: Evolve solver BR against fixed σ_G
        print(f"sigma_g_full: {sigma_g_full}")
        solver_code, solver_algorithm, solver_params, solver_score = self._evolve_solver_br(sigma_g_full)
        

        # Step 4: Evolve generator BR against fixed σ_S (can be disabled)
        print(f"sigma_h: {sigma_h}")
        if getattr(self.cfg, 'disable_generator_evolution', False):
            if self.debug_mode:
                print("    Generator evolution disabled; keeping simple/baseline generator only")
            gen_config = {"code": "", "algorithm": "simple_fixed", "params": {}, "score": 0.0}
            generator_score = 0.0
        else:
            gen_config, generator_score = self._evolve_generator_br(heuristics, sigma_h)
        
        
        new_h_idxs, new_g_idxs = self._get_new_indices()
        utility_update_start = time.time()
        self._update_utilities_incremental(new_h_idxs, new_g_idxs)
        utility_update_time = time.time() - utility_update_start
        self._utility_matrix_update_time = utility_update_time
        
        # Calculate total round time
        total_round_time = time.time() - round_start_time
        self._total_round_time = total_round_time
        
        
        print_iteration_summary(
            self.iteration, solver_score, gen_config, sigma_h, sigma_g_full,
            self.meta.utilities.shape, self.meta.utilities,
            self.pool_manager, self.cfg, self.pools
        )

        # self._maybe_remove_initial_solver()

    def _maybe_remove_initial_solver(self):
        h0_idx = None
        for i, s in enumerate(self.pools.solver_pool):
            if s.program_id == "h0":
                h0_idx = i
                break
        if h0_idx is None:
            return 

        if self.pools.n_solvers <= 1:
            return 

        print(f"    Removing initial solver h0 at index {h0_idx}")
        self._utility_cache.clear()
        self.pools.remove_solver(h0_idx)

        n_h_meta, n_g_meta = self.meta.utilities.shape
        assert n_h_meta == self.pools.n_solvers

 
    # ---------- Internals ----------
    
    def _evolve_solver_br(self, sigma_g_full: np.ndarray) -> Tuple[str, str, Dict, float]:
        """
        Evolve solver BR against generator mix σ_G.
        
        Args:
            sigma_g_full: Full generator mixture from NE (includes simple/baseline generator at index 0)
            
        Returns:
            (solver_code, solver_algorithm, solver_params, solver_score)
        """
        if len(self.pools.generator_pool) == 0:
            raise ValueError("No generators in pool")
        
        use_latest_only = getattr(self.cfg, 'psro_use_latest_only', False)
        
        if use_latest_only:
            adjusted_sigma_g_full = sigma_g_full.copy()
        else:
            simple_weight = self.cfg.min_simple_ratio
            remaining_weight = 1.0 - simple_weight
            
            if len(sigma_g_full) == 1:
                adjusted_sigma_g_full = np.array([1.0])
            else:
                adjusted_sigma_g_full = np.zeros_like(sigma_g_full)
                adjusted_sigma_g_full[0] = simple_weight
                
                evolved_weights = sigma_g_full[1:]
                if evolved_weights.sum() > 0:
                    normalized_evolved = evolved_weights / evolved_weights.sum()
                else:
                    normalized_evolved = np.ones(len(evolved_weights)) / len(evolved_weights) if len(evolved_weights) > 0 else evolved_weights
                adjusted_sigma_g_full[1:] = normalized_evolved * remaining_weight
        
        if self.debug_mode:
            print(f"      Strategy C: {len(adjusted_sigma_g_full)} generators, weights={adjusted_sigma_g_full}")
        
        weight_threshold = 0.1
        generator_codes = []
        generator_ids = []
        filtered_weights = []
        
        for pool_idx, gen_prog in enumerate(self.pools.generator_pool):
            if (pool_idx >= len(adjusted_sigma_g_full) or 
                adjusted_sigma_g_full[pool_idx] <= weight_threshold or
                not gen_prog.code):
                continue
            
            weight = adjusted_sigma_g_full[pool_idx]
            gen_code = gen_prog.code
            generator_codes.append(gen_code)
            generator_ids.append(pool_idx)
            filtered_weights.append(weight)
        
        if len(generator_codes) == 0:
            first_code = self.pools.generator_pool[0].code
            if not first_code:
                raise ValueError("No valid generators with code")
            generator_codes = [first_code]
            generator_ids = [0]
            filtered_weights = [1.0]
        
        filtered_weights = np.array(filtered_weights)
        filtered_weights = filtered_weights / filtered_weights.sum()
        
        adjusted_sigma_g_full = filtered_weights
        
        # Build evolution context if enabled
        solver_context = None
        if getattr(self.cfg, 'evolution_context_enabled', True):
            sigma_g = adjusted_sigma_g_full[1:] if len(adjusted_sigma_g_full) > 1 else np.array([])
            solver_context = build_solver_context(self.pools, adjusted_sigma_g_full, sigma_g)
        
        # Run EoH evolution for solver
        solver_evolution_start = time.time()


        solver_results = self.eoh.evolve_solver_oracle_with_population(
            generator_samplers=None, sigma_g=None, n_instances=self.cfg.eoh_eval_n_instances,
            continue_from_generation=self._solver_eoh_generation,
            generator_codes=generator_codes,
            generator_ids=generator_ids,
            generator_weights=adjusted_sigma_g_full,
            evolution_context=solver_context
        )
        solver_evolution_time = time.time() - solver_evolution_start
        self._solver_evolution_time = solver_evolution_time
        solver_n_pop = getattr(self.cfg, 'solver_n_pop', getattr(self.cfg, 'n_pop', 2))
        self._solver_eoh_avg_time_per_gen = solver_evolution_time / solver_n_pop if solver_n_pop > 0 else 0
        
        solver_time_info = getattr(self.eoh, '_last_solver_eoh_time_info', {})
        self._solver_code_generation_time = solver_time_info.get('code_generation_time', None)
        self._solver_evaluation_time = solver_time_info.get('evaluation_time', None)
        
        # Update solver EOH generation for next round
        solver_n_pop = getattr(self.cfg, 'solver_n_pop', getattr(self.cfg, 'n_pop', 2))
        self._solver_eoh_generation += solver_n_pop
        
        # Handle top-k results
        def add_solver(id, code, algorithm, params, score):
            metadata = {"source": "br_solver_sigmaG", "score": score}
            self.pools.add_solver(id, code, algorithm, params, metadata)
        
        success, added_candidate = self._handle_top_k_candidates(
            solver_results, "solver", add_solver, None
        )
        
        if success and added_candidate:
            return added_candidate
        raise ValueError("No solver candidates available")
    
    def _evolve_generator_br(self, heuristics: List[str], sigma_h: np.ndarray) -> Tuple[Dict, float]:
        """
        Evolve generator BR against solver mix σ_S.
        
        Args:
            heuristics: List of solver heuristic codes
            sigma_h: Solver mixture weights
            
        Returns:
            (gen_config, generator_score)
        """
        weight_threshold = 0.1
        heuristics_filtered = []
        sigma_h_filtered = []
        
        for heuristic_code, weight in zip(heuristics, sigma_h):
            if weight > weight_threshold:
                heuristics_filtered.append(heuristic_code)
                sigma_h_filtered.append(weight)
        
        if len(heuristics_filtered) == 0:
            if len(heuristics) == 0:
                raise ValueError("No valid solvers")
            heuristics_filtered = [heuristics[0]]
            sigma_h_filtered = [1.0]
        
        sigma_h_filtered = np.array(sigma_h_filtered)
        sigma_h_filtered = sigma_h_filtered / sigma_h_filtered.sum()
        
        if self.debug_mode:
            print(f"      Generator BR: {len(heuristics_filtered)} solvers (after filtering), weights={sigma_h_filtered}")
        
        # Build evolution context if enabled
        generator_context = None
        if getattr(self.cfg, 'evolution_context_enabled', True):
            generator_context = build_generator_context(self.pools, heuristics_filtered, sigma_h_filtered)
        
        # Run EoH evolution for generator
        generator_evolution_start = time.time()
        if self.debug_mode:
            print(f"      [GeneratorEvol] Starting EOH evolution with {len(heuristics_filtered)} solvers...", flush=True)
        generator_results = self.eoh.evolve_generator_oracle_with_population(
            heuristics_filtered, sigma_h_filtered,
            continue_from_generation=self._generator_eoh_generation,
            evolution_context=generator_context
        )
        generator_evolution_time = time.time() - generator_evolution_start
        print(f"      [GeneratorEvol] EOH evolution completed in {generator_evolution_time:.1f}s", flush=True)
        generator_evolution_time = time.time() - generator_evolution_start
        self._generator_evolution_time = generator_evolution_time
        generator_n_pop = getattr(self.cfg, 'generator_n_pop', getattr(self.cfg, 'n_pop', 2))
        self._generator_eoh_avg_time_per_gen = generator_evolution_time / generator_n_pop if generator_n_pop > 0 else 0
        
        generator_time_info = getattr(self.eoh, '_last_generator_eoh_time_info', {})
        self._generator_code_generation_time = generator_time_info.get('code_generation_time', None)
        self._generator_evaluation_time = generator_time_info.get('evaluation_time', None)
        
        # Update generator EOH generation for next round
        generator_n_pop = getattr(self.cfg, 'generator_n_pop', getattr(self.cfg, 'n_pop', 2))
        self._generator_eoh_generation += generator_n_pop
        
        # Handle top-k results
        def add_generator(id, code, algorithm, params, score):
            metadata = {"source": "br_generator_sigmaH", "score": score}
            self.pools.add_generator(id, code, algorithm, params, metadata)
        
        success, added_candidate = self._handle_top_k_candidates(
            generator_results, "generator", add_generator, None
        )
        
        if success and added_candidate:
            gen_code, gen_algorithm, gen_params, generator_score = added_candidate
            return {
                "code": gen_code,
                "algorithm": gen_algorithm,
                "params": gen_params,
                "score": generator_score
            }, generator_score
        raise ValueError("No generator candidates available")
    
    def _handle_top_k_candidates(self, candidates, candidate_type: str, 
                                 add_func, check_func=None) -> Tuple[bool, Any]:
        """
        Generic handler for top-k candidate selection and addition.
        
        Args:
            candidates: List of candidates or single candidate
            candidate_type: "solver" or "generator" (for logging)
            add_func: Callable to add candidate
                     Signature: add_func(id, code, algorithm, params, score)
                     - params can be empty dict {} for solver
            check_func: Unused (kept for backward compatibility)
        
        Returns:
            (success: bool, candidate_data: tuple)
            - success: Whether a candidate was successfully added
            - candidate_data: The data of the added candidate (or None if failed)
        """
        def validate_score(score):
            if candidate_type == "solver":
                use_gap = getattr(self.cfg, 'solver_use_gap', None)
                max_score = 1e6 if (use_gap is not None and not use_gap) else 1e2
            else:
                max_score = 1e2  
            
            if abs(score) >= max_score or not np.isfinite(score):
                print(f"       Rejected: Score too large (likely evaluation error): {score:.4f}")
                return False
            if max_score <= 1e2 and score > 1000:
                print(f"       Rejected: Score unexpectedly positive and large: {score:.4f}")
                return False
            return True
        
        def try_add_candidate(candidate, candidate_id):
            try:
                code, algorithm, params, score = candidate
                add_func(candidate_id, code, algorithm, params, score)
                return True, candidate
            except ValueError as e:
                print(f"      Rejected: {str(e)}")
                return False, None
        
        if not isinstance(candidates, list):
            candidates = [candidates]
        
        if len(candidates) > 1:
            print(f"     Received {len(candidates)} {candidate_type} candidates")
        
        for idx, candidate in enumerate(candidates):
            code, algorithm, params, score = candidate
            
            if not validate_score(score):
                continue
            
            if candidate_type == 'solver':
                candidate_id = f"h{self.pools.n_solvers}"
            else:
                candidate_id = f"g{self.pools.n_generators}"
            
            if len(candidates) == 1:
                print(f"    Single {candidate_type} candidate score: {score:.4f}")
            else:
                print(f"    Attempting to add {candidate_type} candidate {idx+1}/{len(candidates)}")
            
            success, added_candidate = try_add_candidate(candidate, candidate_id)
            if success:
                return True, added_candidate
        
        if len(candidates) > 1:
            print(f"     All {len(candidates)} candidates were rejected")
        return False, None
    
    def _get_new_indices(self) -> Tuple[List[int], List[int]]:
        n_h, n_g = self.meta.utilities.shape
        new_h = list(range(n_h, self.pools.n_solvers))
        new_g = list(range(n_g, self.pools.n_generators))
        
        if n_h == self.pools.n_solvers and n_g == self.pools.n_generators:
            new_h = []
            new_g = []
            for hi in range(self.pools.n_solvers):
                for gj in range(self.pools.n_generators):
                    if (hi, gj) not in self._utility_cache:
                        if hi not in new_h:
                            new_h.append(hi)
                        if gj not in new_g:
                            new_g.append(gj)
        
        return new_h, new_g

    def _update_utilities_incremental(self, new_h: List[int], new_g: List[int]) -> None:
        total_pairs = len(new_h) * self.pools.n_generators + len(new_g) * self.pools.n_solvers
        
        if total_pairs == 0:
            return
        
        tasks = []
        cache_hits = {} 
        
        for hi in new_h:
            for gj in range(self.pools.n_generators):
                cache_key = (hi, gj)
                if cache_key in self._utility_cache:
                    cache_hits[cache_key] = self._utility_cache[cache_key]
                else:
                    tasks.append((hi, gj))
        
        for gj in new_g:
            for hi in range(self.pools.n_solvers):
                if hi not in new_h:
                    cache_key = (hi, gj)
                    if cache_key in self._utility_cache:
                        cache_hits[cache_key] = self._utility_cache[cache_key]
                    else:
                        tasks.append((hi, gj))
        
        for (hi, gj), gap in cache_hits.items():
            self.meta.set_utility(hi, gj, gap)
        
        if not tasks:
            return
        
        import hashlib
        
        task_data = []
        base_seed = self.cfg.seed if self.cfg.seed is not None else 42
        
        for hi, gj in tasks:
            try:
                code = self.pools.get_solver(hi).code
                
                seed_key = f"{hi}_{gj}_{base_seed}"
                seed = int(hashlib.md5(seed_key.encode()).hexdigest()[:8], 16) % (2**31)
                
                np.random.seed(seed)
                instances = self.problem_sampler.sample_from_single_generator(gj, n=self.cfg.eval_n_instances)
                
                if len(instances) == 0:
                    print(f"    [UtilityUpdate] WARNING: No instances generated for generator {gj}")
                
                task_data.append((hi, gj, code, instances))
            except Exception as e:
                print(f"      Warning: Failed to prepare task ({hi}, {gj}): {e}")
                task_data.append((hi, gj, None, None))
        
        def eval_single_task(args):
            hi, gj, code_str, instances = args
            if code_str is None or instances is None:
                return hi, gj, 1e9, "Code or instances retrieval failed"
            try:
                gap = self.problem_adapter.evaluate_solver(code_str, instances, utility_cache=self._utility_cache)
                return hi, gj, gap, None
            except Exception as e:
                return hi, gj, 1e9, str(e)
        
        n_jobs = getattr(self.cfg, 'eval_n_jobs', -1)
        
        instance_time_limit = getattr(self.cfg, 'instance_solver_time_limit', 60)
        oracle_timeout = getattr(self.cfg, 'oracle_timeout', 0)   
        timeout_per_task = instance_time_limit + oracle_timeout + 10
        batch_timeout = len(task_data) * timeout_per_task * 1.5 if task_data else None
        
        try:
            results = Parallel(
                n_jobs=n_jobs,
                # backend="threading",
                backend="loky",
                prefer="processes", 
                # prefer="threads",
                pre_dispatch="2*n_jobs",
                batch_size="auto",
                timeout=batch_timeout,
            )(
                delayed(eval_single_task)(args) for args in task_data
            )
        except Exception as e:
            print(f"      Warning: Parallel evaluation failed ({e}), falling back to sequential")
            results = [eval_single_task(args) for args in task_data]
        
        for hi, gj, gap, error in results:
            if error is not None:
                print(f"      Warning: Evaluation failed for ({hi}, {gj}): {error}")
                gap = 1e9  
            if gap == 0.0 or (np.isnan(gap) and hi > 0 and gj > 0) or (np.isinf(gap) and abs(gap) < 1e8):
                print(f"    [UtilityUpdate] WARNING: Unexpected gap value for ({hi}, {gj}): {gap}")
            
            self._utility_cache[(hi, gj)] = gap
            self.meta.set_utility(hi, gj, gap)
        print(f"    U-update: hits={len(cache_hits)}, tasks={len(tasks)}, n_jobs={n_jobs}")