from __future__ import annotations

from dataclasses import dataclass, field
from typing import Optional, List


@dataclass
class HeuPSROConfig:
    max_rounds: int = 8
    min_simple_ratio: float = 0.3  # lower bound for simple/baseline generator sampling share
    
    seed: Optional[int] = 42
    
    # === EOH  ===
    eoh_time_budget_minutes: int = 5  # optional time budget per run
    pop_size: int = 10 # population size for each generation
    # n_pop: int = 2  # number of evolution generations (deprecated, use solver_n_pop and generator_n_pop instead)
    solver_n_pop: int = 2  # number of evolution generations for solver EOH
    generator_n_pop: int = 2  # number of evolution generations for generator EOH
    # EOH operator parent count (used by 'e1'/'e2' operators)
    ec_m: int = 2
    # EOH operator set (e1/e2: crossover variants; m1/m2/m3: mutations)
    ec_operators: List[str] = field(default_factory=lambda: ["e1","e2","m1","m2","m3"]) # field(default_factory=lambda: ["e1","e2","m1","m2","m3"])  # e.g., ["e1","e2","m1","m2","m3"]
        
  
    psro_use_latest_only: bool = False  
    meta_game_solver: str = "ne"  # Meta-game: "ne"  or "alpha_rank" (Alpha-Rank)
    # Alpha-Rank 
    alpha_rank_alpha: float = 12.0  # selection intensity
    alpha_rank_num_iters: int = 10_000  # power iteration 
    alpha_rank_tol: float = 1e-10  

    evolution_context_enabled: bool = False  
    disable_generator_evolution: bool = False
    
    eoh_eval_n_instances: int = 3  # number of instances for EOH individual evaluation
    eval_n_instances: int = 3  # number of instances to use for utility matrix evaluation 
    
    eoh_framework_timeout: int = 300  # EoH framework-level evaluation timeout (seconds)
                                       # Should be >= (instance_solver_time_limit * n_instances + oracle_timeout + buffer)
                                       # For TSP: >= (60 * 3 + 30 + 50) = 260s
                                       # For BP: >= (5 * 3 + 0 + 20) = 35s
    instance_solver_time_limit: int = 60  # Time limit for solving a single instance (seconds)
                                           # TSP: GLS solver time limit
                                           # BP: Bin packing time limit (usually very fast, ~1-5s)
    
    eva_numba_decorator: bool = False
    
    exp_n_proc: int = 128  # number of processes 
    eval_n_jobs: int = 128  
    optimal_parallel_n_jobs: int = 150  # Optimal(oracle)
    parallel_backend: str = "loky"  
    parallel_prefer: str = "processes" 
    
    # === LLM  ===
    llm_model: str = "--"
    llm_api_endpoint: str = "api.deepseek.com"
    llm_api_key: str = "--"

    llm_temperature: float = 1  
    llm_top_p: float = 0.6  

    llm_use_local: bool = False
    
    llm_use_async: bool = True  
    llm_max_concurrent_requests: int = 10 
    llm_rate_limit_per_minute: int = 60 

    # === Generator ===
    generator_use_gap: bool = True 
    
    # === Data Augmentation ===
    da: bool = False 

    # === EOH Diversity ===
    # eoh_diversity_enabled: bool = False   
    eoh_diversity_threshold: float = 0.8 
    eoh_management_strategy: str = "pop_diverse" 
    eoh_objective_precision: int = 3 
    eoh_max_per_objective: int = 1 
    
    # === PSRO Diversity===
    psro_diversity_enabled: bool = True     
    psro_code_similarity_threshold: float = 0.8 
    psro_behavioral_diversity_threshold: float = 0.7 
    psro_max_pool_size_solver: int = 50 
    psro_max_pool_size_generator: int = 50 
    psro_diversity_weight_code: float = 0.5 
    psro_diversity_weight_behavior: float = 0.5 
    
    psro_use_top_k: bool = True 
    psro_top_k: int =10 
    
    experiment_name: str = "psro_experiment"
    save_frequency: int = 1  
    log_frequency: int = 1  
    debug_mode: bool = False
    exp_debug_mode: bool = False
