from __future__ import annotations

from dataclasses import dataclass
from typing import Optional

from ...core.config import HeuPSROConfig
 

@dataclass
class BPOnlineConfig(HeuPSROConfig):
    """BP Online 任务特定配置 - 继承通用配置"""
    
    # === BP Online 任务参数 ===
    capacity: int = 100  
    num_items: int = 50  

    # # # da: bool = True 
    solver_n_pop: int = 4  # number of evolution generations for solver EOH
    generator_n_pop: int = 2  # number of evolution generations for generator EOH
    eoh_eval_n_instances: int = 2   # number of instances for EOH individual evaluation 
    eval_n_instances: int = 2 # number of instances to use for utility matrix evaluation 
    eoh_objective_precision: int = 2




    # === BP Online ===
    instance_solver_time_limit: int = 5  # BP Online solver time limit per instance (seconds)
    psro_use_latest_only: bool = False  # only use the latest strategy in the pool (instead of Nash equilibrium mixed)
    evolution_context_enabled: bool = False
    # === Oracle ===
    oracle_type: str = "cp-sat"  # "lb" (lower bound), "cp-sat" (exact solution), or "none"
    oracle_timeout: int = 240  # CP-SAT solution timeout (seconds)
    pop_size: int = 20

    meta_game_solver: str = "alpha_rank"
    alpha_rank_alpha: float = 7.5
    min_simple_ratio: float = 0.3

    # eoh_management_strategy: str = "pop_greedy"

    eoh_framework_timeout: int = 900

    # === Batch evaluation parameters ===
    batch_eval_task_batch_size: Optional[int] = None  

    debug_mode: bool = False
    eoh_management_strategy: str = "pop_greedy"
