from __future__ import annotations

import numpy as np
import hashlib
from typing import List, Optional, Dict, Tuple

from ..shared.batch_eval import batch_evaluate_tasks, evaluate_single_solver_instance, prepare_tasks


class CVRPSolverProblem:
    """Evaluate solver code using batch evaluation with Strategy C (separate evaluate + weighted sum).

    Tasks are built by the shared ``prepare_tasks`` function and executed by
    ``batch_evaluate_tasks``. The per-(solver, generator) results are then
    combined into one fitness value per solver as a weighted sum over
    ``generator_ids``.

    The instances and oracle costs returned by ``prepare_tasks`` are cached on
    the object and reused by later ``evaluate_batch`` calls for as long as the
    generator configuration (see ``_compute_cache_key``) does not change.
    """

    # Value substituted for a (solver, generator) result that is missing or None.
    _FAILURE_PENALTY = 1e9

    def __init__(
        self,
        config,
        generator_codes: Optional[List[str]] = None,
        generator_ids: Optional[List[int]] = None,
        generator_weights: Optional[np.ndarray] = None,
        num_customers: Optional[int] = None,
        n_inst_eva: Optional[int] = None,  # optional override
    ):
        """Initialize CVRP Solver Problem.

        Args:
            config: HeuPSROConfig. ``eoh_eval_n_instances`` is read directly
                when ``n_inst_eva`` is falsy; every other setting is read with
                ``getattr`` and a fallback default.
            generator_codes: Generator code strings (defaults to an empty list).
            generator_ids: Generator IDs (defaults to an empty list).
            generator_weights: Generator weights, positionally aligned with
                ``generator_ids`` (defaults to an empty array).
            num_customers: Number of customers.
            n_inst_eva: Number of instances; overrides
                ``config.eoh_eval_n_instances`` when truthy.
        """
        self.config = config
        self.generator_codes = generator_codes or []
        self.generator_ids = generator_ids or []
        self.generator_weights = generator_weights if generator_weights is not None else np.array([])
        self.num_customers = num_customers

        self.n_inst_eva = n_inst_eva or config.eoh_eval_n_instances
        self.time_limit = getattr(config, 'instance_solver_time_limit', 30)
        self.use_gap = getattr(config, 'generator_use_gap', True)
        self.gap_oracle = getattr(config, 'oracle_type', 'ortools')
        self.gap_oracle_timeout = getattr(config, 'oracle_timeout', 60)
        self.debug_mode = getattr(config, 'debug_mode', False)
        self.parallel_backend = getattr(config, 'parallel_backend', 'loky')
        self.parallel_prefer = getattr(config, 'parallel_prefer', 'processes')
        self.parallel_n_jobs = getattr(config, 'eval_n_jobs', -1)
        self.max_iterations = getattr(config, 'ls_max_iterations', 1000)
        self.max_stagnation = getattr(config, 'ls_max_stagnation', 10)
        self.vehicle_capacity = getattr(config, 'vehicle_capacity', 100)
        self.num_vehicles = getattr(config, 'num_vehicles', None)

        # Cache for instances and oracle costs (within same PSRO round)
        self._cached_instances = None
        self._cached_oracle_costs = None
        self._cache_key = None

        # Add prompts attribute that EoH might expect
        from .prompts import GetPrompts
        self.prompts = GetPrompts()

    def set_evolution_context(self, context: Optional[str] = None, enabled: bool = True) -> None:
        """
        Set evolution context for PSRO-level task description.

        Does nothing when the object has no ``prompts`` attribute or it is None.

        Args:
            context: Context string describing the mixed generator distribution
            enabled: Whether to use context in prompts
        """
        prompts = getattr(self, 'prompts', None)
        if prompts is not None:
            prompts.set_context(context, enabled)

    def evaluate(self, code_string: str, n_instances: Optional[int] = None) -> float:
        """Evaluate single solver (backward compatibility).

        NOTE: ``n_instances`` is accepted for interface compatibility only and
        is not used; the instance count always comes from ``self.n_inst_eva``.

        Args:
            code_string: Solver code string.
            n_instances: Ignored.

        Returns:
            The fitness of the solver, i.e. the single element returned by
            ``evaluate_batch([code_string])``.
        """
        return self.evaluate_batch([code_string])[0]

    def _weights_vector(self) -> np.ndarray:
        """Return ``generator_weights`` as a flat 1-D float array.

        Accepts lists, tuples, scalars and arrays of any shape, so the cache
        key and the weighted sum both see the same flattened weights.
        """
        if self.generator_weights is None:
            return np.array([], dtype=float)
        return np.atleast_1d(np.asarray(self.generator_weights, dtype=float)).ravel()

    def _compute_cache_key(self) -> str:
        """Return a digest of the settings the cached instances/oracle costs are keyed on.

        Besides the generator configuration, the key covers the vehicle
        settings, oracle settings and seed that are handed to
        ``prepare_tasks``, so changing any of them invalidates the cache
        instead of reusing stale data.
        """
        key_fields = (
            tuple(self.generator_codes),
            tuple(self.generator_ids),
            # Plain Python floats: the repr does not depend on the container type.
            tuple(self._weights_vector().tolist()),
            self.n_inst_eva,
            self.num_customers,
            self.vehicle_capacity,
            self.num_vehicles,
            self.use_gap,
            self.gap_oracle,
            self.gap_oracle_timeout,
            getattr(self.config, 'seed', None),
        )
        # The digest is only ever compared with itself inside this object.
        return hashlib.sha256(repr(key_fields).encode()).hexdigest()

    def _prepare_tasks(self, code_strings, solver_ids, cached_instances, cached_oracle_costs):
        """Call the shared ``prepare_tasks`` with this problem's settings.

        ``cached_instances`` / ``cached_oracle_costs`` are forwarded unchanged;
        pass None for both to request fresh instances and oracle costs.

        Returns:
            The 3-tuple returned by ``prepare_tasks``, unpacked by the caller
            as (tasks, instances by generator, oracle costs).
        """
        return prepare_tasks(
            solver_codes=code_strings,
            solver_ids=solver_ids,
            generator_codes=self.generator_codes,
            generator_ids=self.generator_ids,
            generator_weights=self.generator_weights,
            n_instances=self.n_inst_eva,
            num_customers=self.num_customers,
            vehicle_capacity=self.vehicle_capacity,
            num_vehicles=self.num_vehicles,
            time_limit=self.time_limit,
            use_gap=self.use_gap,
            gap_oracle=self.gap_oracle,
            oracle_timeout=self.gap_oracle_timeout,
            optimal_parallel_n_jobs=getattr(self.config, 'optimal_parallel_n_jobs', -1),
            debug_mode=self.debug_mode,
            cached_instances=cached_instances,
            cached_oracle_costs=cached_oracle_costs,
            config=self.config,
            max_iterations=self.max_iterations,
            max_stagnation=self.max_stagnation,
            random_seed=getattr(self.config, 'seed', None),
        )

    def _aggregate_fitness(self, results_dict, n_solvers: int) -> List[float]:
        """Combine per-(solver, generator) results into one fitness per solver.

        Args:
            results_dict: Mapping from ``(solver_id, gen_id)`` to a numeric
                result; a missing key or a None value counts as
                ``_FAILURE_PENALTY``.
            n_solvers: Number of solvers; solver ids are ``0 .. n_solvers - 1``.

        Returns:
            One float per solver: the sum over ``generator_ids`` of
            ``weight * result``. A generator without a matching weight
            contributes with weight 0.0, so the result is 0.0 for every solver
            when ``generator_ids`` is empty.
        """
        weights = self._weights_vector()
        n_weights = len(weights)
        fitnesses = []
        for solver_id in range(n_solvers):
            weighted_sum = 0.0
            for gen_idx, gen_id in enumerate(self.generator_ids):
                mean_gap = results_dict.get((solver_id, gen_id))
                if mean_gap is None:
                    mean_gap = self._FAILURE_PENALTY
                weight = weights[gen_idx] if gen_idx < n_weights else 0.0
                weighted_sum += weight * mean_gap
            fitnesses.append(float(weighted_sum))
        return fitnesses

    def evaluate_batch(self, code_strings: List[str]) -> List[float]:
        """
        batch evaluate multiple solver codes.

        Args:
            code_strings: List of solver code strings [code_0, code_1, ..., code_n-1]

        Returns:
            List of fitness values [fitness_0, fitness_1, ..., fitness_n-1]
        """
        n_solvers = len(code_strings)
        solver_ids = list(range(n_solvers))

        # Step 1: build tasks, reusing cached instances/oracle costs when the
        # configuration is unchanged since they were produced.
        cache_key = self._compute_cache_key()
        cache_is_valid = (
            self._cache_key == cache_key
            and self._cached_instances is not None
            and (not self.use_gap or self._cached_oracle_costs is not None)
        )

        if cache_is_valid:
            all_tasks, _, _ = self._prepare_tasks(
                code_strings,
                solver_ids,
                self._cached_instances,
                self._cached_oracle_costs,
            )
        else:
            all_tasks, instances_by_gen, oracle_costs = self._prepare_tasks(
                code_strings, solver_ids, None, None
            )
            self._cached_instances = instances_by_gen
            self._cached_oracle_costs = oracle_costs
            self._cache_key = cache_key

        # Step 2: call shared batch evaluation
        timeout_per_task = self.time_limit + self.gap_oracle_timeout + 10
        batch_timeout = len(all_tasks) * timeout_per_task * 1.5 if all_tasks else None
        results_dict = batch_evaluate_tasks(
            tasks=all_tasks,
            evaluate_fn=evaluate_single_solver_instance,
            n_jobs=self.parallel_n_jobs,
            backend=self.parallel_backend,
            prefer=self.parallel_prefer,
            timeout=batch_timeout,
            debug_mode=self.debug_mode,
            track_time=True,
            time_key="solver",
        )

        # Step 3: weight each generator's result and sum per solver
        return self._aggregate_fitness(results_dict, n_solvers)




