"""
Main controller for OpenEvolve
"""

import asyncio
import json
import logging
import os
import shutil
import signal
import time
import uuid
from pathlib import Path
from typing import Any, Dict, List, Optional, Union

from openevolve.config import Config, load_config
from openevolve.database import Program, ProgramDatabase
from openevolve.evaluator import Evaluator
from openevolve.evolution_trace import EvolutionTracer
from openevolve.llm.ensemble import LLMEnsemble
from openevolve.process_parallel import ProcessParallelController
from openevolve.prompt.sampler import PromptSampler
from openevolve.utils.code_utils import extract_code_language
from openevolve.utils.format_utils import format_improvement_safe, format_metrics_safe
from openevolve.utils.metrics_utils import get_fitness_score
from openevolve.utils.wandb_logger import create_wandb_logger, flatten_scalars

logger = logging.getLogger(__name__)


def _format_metrics(metrics: Dict[str, Any]) -> str:
    """Safely format metrics, handling both numeric and string values"""
    formatted_parts = []
    for name, value in metrics.items():
        if isinstance(value, (int, float)) and not isinstance(value, bool):
            try:
                formatted_parts.append(f"{name}={value:.4f}")
            except (ValueError, TypeError):
                formatted_parts.append(f"{name}={value}")
        else:
            formatted_parts.append(f"{name}={value}")
    return ", ".join(formatted_parts)


def _format_improvement(improvement: Dict[str, Any]) -> str:
    """Safely format improvement metrics"""
    formatted_parts = []
    for name, diff in improvement.items():
        if isinstance(diff, (int, float)) and not isinstance(diff, bool):
            try:
                formatted_parts.append(f"{name}={diff:+.4f}")
            except (ValueError, TypeError):
                formatted_parts.append(f"{name}={diff}")
        else:
            formatted_parts.append(f"{name}={diff}")
    return ", ".join(formatted_parts)


class OpenEvolve:
    """
    Main controller for OpenEvolve

    Orchestrates the evolution process, coordinating between the prompt sampler,
    LLM ensemble, evaluator, and program database.

    Features:
    - Tracks the absolute best program across evolution steps
    - Ensures the best solution is not lost during the MAP-Elites process
    - Always includes the best program in the selection process for inspiration
    - Maintains detailed logs and metadata about improvements
    """

    def __init__(
        self,
        initial_program_path: str,
        evaluation_file: str,
        config: Config,
        output_dir: Optional[str] = None,
    ):
        # Load configuration (loaded in main_async)
        self.config = config

        # Set up output directory
        self.output_dir = output_dir or os.path.join(
            os.path.dirname(initial_program_path), "openevolve_output"
        )
        os.makedirs(self.output_dir, exist_ok=True)

        # Set up logging
        self._setup_logging()

        # Manual mode queue lives in <openevolve_output>/manual_tasks_queue
        self._setup_manual_mode_queue()

        # Set random seed for reproducibility if specified
        if self.config.random_seed is not None:
            import hashlib
            import random

            import numpy as np

            # Set global random seeds
            random.seed(self.config.random_seed)
            np.random.seed(self.config.random_seed)

            # Create hash-based seeds for different components
            base_seed = str(self.config.random_seed).encode("utf-8")
            llm_seed = int(hashlib.md5(base_seed + b"llm").hexdigest()[:8], 16) % (2**31)

            # Propagate seed to LLM configurations
            self.config.llm.random_seed = llm_seed
            for model_cfg in self.config.llm.models:
                if not hasattr(model_cfg, "random_seed") or model_cfg.random_seed is None:
                    model_cfg.random_seed = llm_seed
            for model_cfg in self.config.llm.evaluator_models:
                if not hasattr(model_cfg, "random_seed") or model_cfg.random_seed is None:
                    model_cfg.random_seed = llm_seed

            logger.info(f"Set random seed to {self.config.random_seed} for reproducibility")
            logger.debug(f"Generated LLM seed: {llm_seed}")

        # Load initial program
        self.initial_program_path = initial_program_path
        self.initial_program_code = self._load_initial_program()
        if not self.config.language:
            self.config.language = extract_code_language(self.initial_program_code)

        # Extract file extension from initial program
        self.file_extension = os.path.splitext(initial_program_path)[1]
        if not self.file_extension:
            # Default to .py if no extension found
            self.file_extension = ".py"
        else:
            # Make sure it starts with a dot
            if not self.file_extension.startswith("."):
                self.file_extension = f".{self.file_extension}"

        # Set the file_suffix in config (can be overridden in YAML)
        if not hasattr(self.config, "file_suffix") or self.config.file_suffix == ".py":
            self.config.file_suffix = self.file_extension

        # Initialize components
        self.llm_ensemble = LLMEnsemble(self.config.llm.models)
        self.llm_evaluator_ensemble = LLMEnsemble(self.config.llm.evaluator_models)

        self.prompt_sampler = PromptSampler(self.config.prompt)
        self.evaluator_prompt_sampler = PromptSampler(self.config.prompt)
        self.evaluator_prompt_sampler.set_templates("evaluator_system_message")

        # Pass random seed to database if specified
        if self.config.random_seed is not None:
            self.config.database.random_seed = self.config.random_seed

        self.config.database.novelty_llm = self.llm_ensemble
        self.database = ProgramDatabase(self.config.database)

        self.evaluator = Evaluator(
            self.config.evaluator,
            evaluation_file,
            self.llm_evaluator_ensemble,
            self.evaluator_prompt_sampler,
            database=self.database,
            suffix=Path(self.initial_program_path).suffix,
        )
        self.evaluation_file = evaluation_file

        logger.info(f"Initialized OpenEvolve with {initial_program_path}")

        # Initialize evolution tracer
        if self.config.evolution_trace.enabled:
            trace_output_path = self.config.evolution_trace.output_path
            if not trace_output_path:
                # Default to output_dir/evolution_trace.{format}
                trace_output_path = os.path.join(
                    self.output_dir, f"evolution_trace.{self.config.evolution_trace.format}"
                )

            self.evolution_tracer = EvolutionTracer(
                output_path=trace_output_path,
                format=self.config.evolution_trace.format,
                include_code=self.config.evolution_trace.include_code,
                include_prompts=self.config.evolution_trace.include_prompts,
                enabled=True,
                buffer_size=self.config.evolution_trace.buffer_size,
                compress=self.config.evolution_trace.compress,
            )
            logger.info(f"Evolution tracing enabled: {trace_output_path}")
        else:
            self.evolution_tracer = None

        # Initialize improved parallel processing components
        self.parallel_controller = None
        self.wandb_logger = create_wandb_logger(self.config.wandb, self.output_dir)
        self._best_fitness_so_far: Optional[float] = None
        self._run_started_at: Optional[float] = None

    def _setup_logging(self) -> None:
        """Set up logging"""
        log_dir = self.config.log_dir or os.path.join(self.output_dir, "logs")
        os.makedirs(log_dir, exist_ok=True)

        # Set up root logger
        root_logger = logging.getLogger()
        root_logger.setLevel(getattr(logging, self.config.log_level))

        # Add file handler
        log_file = os.path.join(log_dir, f"openevolve_{time.strftime('%Y%m%d_%H%M%S')}.log")
        file_handler = logging.FileHandler(log_file)
        file_handler.setFormatter(
            logging.Formatter("%(asctime)s - %(name)s - %(levelname)s - %(message)s")
        )
        root_logger.addHandler(file_handler)

        # Add console handler
        console_handler = logging.StreamHandler()
        console_handler.setFormatter(logging.Formatter("%(asctime)s - %(levelname)s - %(message)s"))
        root_logger.addHandler(console_handler)

        logger.info(f"Logging to {log_file}")

    def _setup_manual_mode_queue(self) -> None:
        """
        Set up manual task queue directory if llm.manual_mode is enabled

        Queue directory is always:
          <openevolve_output>/manual_tasks_queue

        The directory is cleared on controller start so the UI shows only tasks
        from the current run (no stale tasks after restart)
        """
        if not bool(getattr(self.config.llm, "manual_mode", False)):
            return

        qdir = (Path(self.output_dir).expanduser().resolve() / "manual_tasks_queue")

        # Clear stale tasks from previous runs
        if qdir.exists():
            shutil.rmtree(qdir)
        qdir.mkdir(parents=True, exist_ok=True)

        # Inject runtime-only queue dir into configs
        self.config.llm._manual_queue_dir = str(qdir)
        for model_cfg in self.config.llm.models:
            model_cfg._manual_queue_dir = str(qdir)
        for model_cfg in self.config.llm.evaluator_models:
            model_cfg._manual_queue_dir = str(qdir)

        logger.info(f"Manual mode enabled. Queue dir: {qdir}")

    def _load_initial_program(self) -> str:
        """Load the initial program from file"""
        with open(self.initial_program_path, "r") as f:
            return f.read()

    def _get_program_fitness(self, program: Optional[Program]) -> Optional[float]:
        if program is None or not program.metrics:
            return None
        return get_fitness_score(program.metrics, self.database.config.feature_dimensions)

    def _build_wandb_run_metadata(
        self,
        *,
        checkpoint_path: Optional[str],
        max_iterations: int,
        target_score: Optional[float],
    ) -> Dict[str, Any]:
        metadata = {
            "mode": "single-task",
            "initial_program_path": str(Path(self.initial_program_path).resolve()),
            "evaluation_file": str(Path(self.evaluation_file).resolve()),
            "output_dir": str(Path(self.output_dir).resolve()),
            "requested_iterations": max_iterations,
            "target_score": target_score,
        }
        if checkpoint_path:
            metadata["checkpoint_path"] = str(Path(checkpoint_path).resolve())
        return metadata

    def _log_single_task_metrics(
        self,
        *,
        iteration: int,
        metrics: Dict[str, Any],
        step: Optional[int] = None,
    ) -> None:
        payload = {"iteration": iteration}
        payload.update(flatten_scalars(metrics))
        self.wandb_logger.log_metrics(payload, step=step if step is not None else iteration)

    def _log_best_program_artifact(self, program: Program) -> None:
        paths = self._save_best_program(program)
        if not paths:
            return

        fitness = self._get_program_fitness(program)
        artifact_metadata = {
            "iteration": program.iteration_found,
            "fitness": fitness,
            "metrics": flatten_scalars(program.metrics),
            "program_id": program.id,
        }
        self.wandb_logger.log_best_program_artifact(
            paths["code_path"],
            metadata=artifact_metadata,
        )

    def _handle_parallel_iteration_event(self, event: Dict[str, Any]) -> None:
        iteration = int(event["iteration"])
        event_type = event.get("event")
        best_program = self.database.get_best_program()
        best_fitness = self._get_program_fitness(best_program)

        if event_type != "success":
            previous_best = self._best_fitness_so_far
            if best_fitness is not None:
                self._best_fitness_so_far = best_fitness
            self._log_single_task_metrics(
                iteration=iteration,
                metrics={
                    "evaluation_success": 0,
                    "best_fitness_so_far": best_fitness,
                    "delta_best_fitness": 0.0,
                    "failure_type": event_type,
                    "error": event.get("error"),
                    "timeout_seconds": event.get("timeout_seconds"),
                },
            )
            if previous_best is None and best_fitness is not None:
                self.wandb_logger.update_summary({"best_fitness": best_fitness})
            return

        child_program = event["child_program"]
        current_fitness = self._get_program_fitness(child_program)
        previous_best = self._best_fitness_so_far
        if best_fitness is None:
            best_fitness = current_fitness

        delta_best = 0.0
        if best_fitness is not None:
            if previous_best is None:
                delta_best = best_fitness
            else:
                delta_best = max(0.0, best_fitness - previous_best)
            self._best_fitness_so_far = best_fitness

        metric_payload: Dict[str, Any] = {
            "current_fitness": current_fitness,
            "best_fitness_so_far": best_fitness,
            "delta_best_fitness": delta_best,
            "evaluation_success": 1,
            "iteration_time_sec": event.get("iteration_time_sec"),
            "generation_time_sec": event.get("generation_time_sec"),
            "evaluation_time_sec": event.get("evaluation_time_sec"),
            "parent_id": getattr(event.get("parent_program"), "id", None),
            "program_id": child_program.id,
        }
        if child_program.complexity:
            metric_payload["complexity"] = child_program.complexity
        if child_program.diversity:
            metric_payload["diversity"] = child_program.diversity
        metric_payload.update(
            {
                key: value
                for key, value in flatten_scalars(child_program.metrics).items()
                if key not in metric_payload
            }
        )

        self._log_single_task_metrics(iteration=iteration, metrics=metric_payload)

        if event.get("is_new_best"):
            self._log_best_program_artifact(child_program)
            self.wandb_logger.update_summary(
                {
                    "best_fitness": best_fitness,
                    "best_iteration": child_program.iteration_found,
                }
            )

    def _write_summary(
        self,
        *,
        best_program: Optional[Program],
        wall_clock_time_sec: Optional[float],
    ) -> Dict[str, Any]:
        best_fitness = self._get_program_fitness(best_program)
        summary = {
            "output_dir": str(Path(self.output_dir).resolve()),
            "initial_program_path": str(Path(self.initial_program_path).resolve()),
            "evaluation_file": str(Path(self.evaluation_file).resolve()),
            "total_iterations": self.database.last_iteration,
            "wall_clock_time_sec": wall_clock_time_sec,
            "best_program_id": best_program.id if best_program else None,
            "best_iteration": best_program.iteration_found if best_program else None,
            "best_fitness": best_fitness,
            "best_metrics": best_program.metrics if best_program else None,
        }

        summary_path = Path(self.output_dir) / "summary.json"
        with open(summary_path, "w") as handle:
            json.dump(summary, handle, indent=2)

        summary["summary_path"] = str(summary_path)
        return summary

    async def run(
        self,
        iterations: Optional[int] = None,
        target_score: Optional[float] = None,
        checkpoint_path: Optional[str] = None,
    ) -> Optional[Program]:
        """
        Run the evolution process with improved parallel processing

        Args:
            iterations: Maximum number of iterations (uses config if None)
            target_score: Target score to reach (continues until reached if specified)
            checkpoint_path: Path to resume from checkpoint

        Returns:
            Best program found
        """
        max_iterations = iterations or self.config.max_iterations
        self._run_started_at = time.time()

        self.wandb_logger.init_run(
            run_mode="single-task",
            config_payload=self.config,
            metadata=self._build_wandb_run_metadata(
                checkpoint_path=checkpoint_path,
                max_iterations=max_iterations,
                target_score=target_score,
            ),
            step_metric="iteration",
        )

        try:
            # Determine starting iteration
            start_iteration = 0
            if checkpoint_path and os.path.exists(checkpoint_path):
                self._load_checkpoint(checkpoint_path)
                start_iteration = self.database.last_iteration + 1
                logger.info(f"Resuming from checkpoint at iteration {start_iteration}")
            else:
                start_iteration = self.database.last_iteration

            self._best_fitness_so_far = self._get_program_fitness(self.database.get_best_program())

            # Only add initial program if starting fresh (not resuming from checkpoint)
            should_add_initial = (
                start_iteration == 0
                and len(self.database.programs) == 0
                and not any(
                    p.code == self.initial_program_code for p in self.database.programs.values()
                )
            )

            if should_add_initial:
                logger.info("Adding initial program to database")
                initial_program_id = str(uuid.uuid4())

                # Evaluate the initial program
                initial_metrics = await self.evaluator.evaluate_program(
                    self.initial_program_code, initial_program_id
                )

                initial_program = Program(
                    id=initial_program_id,
                    code=self.initial_program_code,
                    changes_description=self.config.prompt.initial_changes_description,
                    language=self.config.language,
                    metrics=initial_metrics,
                    iteration_found=start_iteration,
                )

                self.database.add(initial_program)
                initial_artifacts = self.evaluator.get_pending_artifacts(initial_program_id)
                if initial_artifacts:
                    self.database.store_artifacts(initial_program.id, initial_artifacts)
                self._best_fitness_so_far = self._get_program_fitness(initial_program)
                self._log_single_task_metrics(
                    iteration=0,
                    metrics={
                        "current_fitness": self._best_fitness_so_far,
                        "best_fitness_so_far": self._best_fitness_so_far,
                        "delta_best_fitness": self._best_fitness_so_far or 0.0,
                        "evaluation_success": 1,
                        **flatten_scalars(initial_metrics),
                    },
                    step=0,
                )

                # Check if combined_score is present in the metrics
                if "combined_score" not in initial_metrics:
                    # Calculate average of numeric metrics
                    numeric_metrics = [
                        v
                        for v in initial_metrics.values()
                        if isinstance(v, (int, float)) and not isinstance(v, bool)
                    ]
                    if numeric_metrics:
                        avg_score = sum(numeric_metrics) / len(numeric_metrics)
                        logger.warning(
                            f"⚠️  No 'combined_score' metric found in evaluation results. "
                            f"Using average of all numeric metrics ({avg_score:.4f}) for evolution guidance. "
                            f"For better evolution results, please modify your evaluator to return a 'combined_score' "
                            f"metric that properly weights different aspects of program performance."
                        )
            else:
                logger.info(
                    f"Skipping initial program addition (resuming from iteration {start_iteration} "
                    f"with {len(self.database.programs)} existing programs)"
                )

            # Initialize improved parallel processing
            try:
                self.parallel_controller = ProcessParallelController(
                    self.config,
                    self.evaluation_file,
                    self.database,
                    self.evolution_tracer,
                    file_suffix=self.config.file_suffix,
                    iteration_callback=self._handle_parallel_iteration_event,
                )

                # Set up signal handlers for graceful shutdown
                def signal_handler(signum, frame):
                    logger.info(f"Received signal {signum}, initiating graceful shutdown...")
                    self.parallel_controller.request_shutdown()

                    # Set up a secondary handler for immediate exit if user presses Ctrl+C again
                    def force_exit_handler(signum, frame):
                        logger.info("Force exit requested - terminating immediately")
                        import sys

                        sys.exit(0)

                    signal.signal(signal.SIGINT, force_exit_handler)

                signal.signal(signal.SIGINT, signal_handler)
                signal.signal(signal.SIGTERM, signal_handler)

                self.parallel_controller.start()

                # When starting from iteration 0, we've already done the initial program evaluation
                # So we need to adjust the start_iteration for the actual evolution
                evolution_start = start_iteration
                evolution_iterations = max_iterations

                # If we just added the initial program at iteration 0, start evolution from iteration 1
                if should_add_initial and start_iteration == 0:
                    evolution_start = 1
                    # User expects max_iterations evolutionary iterations AFTER the initial program
                    # So we don't need to reduce evolution_iterations

                # Run evolution with improved parallel processing and checkpoint callback
                await self._run_evolution_with_checkpoints(
                    evolution_start, evolution_iterations, target_score
                )

            finally:
                # Clean up parallel processing resources
                if self.parallel_controller:
                    self.parallel_controller.stop()
                    self.parallel_controller = None

                # Close evolution tracer
                if self.evolution_tracer:
                    self.evolution_tracer.close()
                    logger.info("Evolution tracer closed")

            # Get the best program
            best_program = None
            if self.database.best_program_id:
                best_program = self.database.get(self.database.best_program_id)
                logger.info(f"Using tracked best program: {self.database.best_program_id}")

            if best_program is None:
                best_program = self.database.get_best_program()
                logger.info("Using calculated best program (tracked program not found)")

            if best_program:
                if (
                    hasattr(self, "parallel_controller")
                    and self.parallel_controller
                    and self.parallel_controller.early_stopping_triggered
                ):
                    logger.info(
                        f"🛑 Evolution complete via early stopping. Best program has metrics: "
                        f"{format_metrics_safe(best_program.metrics)}"
                    )
                else:
                    logger.info(
                        f"Evolution complete. Best program has metrics: "
                        f"{format_metrics_safe(best_program.metrics)}"
                    )
                best_paths = self._save_best_program(best_program)
                wall_clock_time_sec = (
                    time.time() - self._run_started_at if self._run_started_at else None
                )
                summary = self._write_summary(
                    best_program=best_program,
                    wall_clock_time_sec=wall_clock_time_sec,
                )
                self.wandb_logger.update_summary(
                    {
                        "best_fitness": summary["best_fitness"],
                        "best_iteration": summary["best_iteration"],
                        "total_iterations": summary["total_iterations"],
                        "wall_clock_time_sec": summary["wall_clock_time_sec"],
                    }
                )
                self.wandb_logger.log_file_artifact(
                    summary["summary_path"],
                    artifact_name="final-summary",
                    artifact_type="summary",
                    metadata={
                        "best_fitness": summary["best_fitness"],
                        "total_iterations": summary["total_iterations"],
                    },
                )
                if best_paths:
                    self.wandb_logger.log_best_program_artifact(
                        best_paths["code_path"],
                        metadata={
                            "iteration": best_program.iteration_found,
                            "fitness": summary["best_fitness"],
                            "metrics": flatten_scalars(best_program.metrics),
                            "program_id": best_program.id,
                        },
                    )
                return best_program

            logger.warning("No valid programs found during evolution")
            summary = self._write_summary(
                best_program=None,
                wall_clock_time_sec=(
                    time.time() - self._run_started_at if self._run_started_at else None
                ),
            )
            self.wandb_logger.update_summary(summary)
            return None
        finally:
            self.wandb_logger.finish()

    def _log_iteration(
        self,
        iteration: int,
        parent: Program,
        child: Program,
        elapsed_time: float,
    ) -> None:
        """
        Log iteration progress

        Args:
            iteration: Iteration number
            parent: Parent program
            child: Child program
            elapsed_time: Elapsed time in seconds
        """
        # Calculate improvement using safe formatting
        improvement_str = format_improvement_safe(parent.metrics, child.metrics)

        logger.info(
            f"Iteration {iteration+1}: Child {child.id} from parent {parent.id} "
            f"in {elapsed_time:.2f}s. Metrics: "
            f"{format_metrics_safe(child.metrics)} "
            f"(Δ: {improvement_str})"
        )

    def _save_checkpoint(self, iteration: int) -> None:
        """
        Save a checkpoint

        Args:
            iteration: Current iteration number
        """
        checkpoint_dir = os.path.join(self.output_dir, "checkpoints")
        os.makedirs(checkpoint_dir, exist_ok=True)

        # Create specific checkpoint directory
        checkpoint_path = os.path.join(checkpoint_dir, f"checkpoint_{iteration}")
        os.makedirs(checkpoint_path, exist_ok=True)

        # Save the database
        self.database.save(checkpoint_path, iteration)

        # Save the best program found so far
        best_program = None
        if self.database.best_program_id:
            best_program = self.database.get(self.database.best_program_id)
        else:
            best_program = self.database.get_best_program()

        if best_program:
            # Save the best program at this checkpoint
            best_program_path = os.path.join(checkpoint_path, f"best_program{self.file_extension}")
            with open(best_program_path, "w") as f:
                f.write(best_program.code)

            # Save metrics
            best_program_info_path = os.path.join(checkpoint_path, "best_program_info.json")
            with open(best_program_info_path, "w") as f:
                import json

                json.dump(
                    {
                        "id": best_program.id,
                        "generation": best_program.generation,
                        "iteration": best_program.iteration_found,
                        "current_iteration": iteration,
                        "metrics": best_program.metrics,
                        "language": best_program.language,
                        "timestamp": best_program.timestamp,
                        "saved_at": time.time(),
                    },
                    f,
                    indent=2,
                )

            logger.info(
                f"Saved best program at checkpoint {iteration} with metrics: "
                f"{format_metrics_safe(best_program.metrics)}"
            )

        logger.info(f"Saved checkpoint at iteration {iteration} to {checkpoint_path}")
        self.wandb_logger.log_checkpoint_artifact(
            checkpoint_path,
            metadata={
                "iteration": iteration,
                "best_program_id": best_program.id if best_program else None,
            },
        )

    def _load_checkpoint(self, checkpoint_path: str) -> None:
        """Load state from a checkpoint directory"""
        if not os.path.exists(checkpoint_path):
            raise FileNotFoundError(f"Checkpoint directory {checkpoint_path} not found")

        logger.info(f"Loading checkpoint from {checkpoint_path}")
        self.database.load(checkpoint_path)
        logger.info(f"Checkpoint loaded successfully (iteration {self.database.last_iteration})")

    async def _run_evolution_with_checkpoints(
        self, start_iteration: int, max_iterations: int, target_score: Optional[float]
    ) -> None:
        """Run evolution with checkpoint saving support"""
        logger.info(f"Using island-based evolution with {self.config.database.num_islands} islands")
        self.database.log_island_status()

        # Run the evolution process with checkpoint callback
        await self.parallel_controller.run_evolution(
            start_iteration, max_iterations, target_score, checkpoint_callback=self._save_checkpoint
        )

        # Check if shutdown or early stopping was triggered
        if self.parallel_controller.shutdown_event.is_set():
            logger.info("Evolution stopped due to shutdown request")
            return
        elif self.parallel_controller.early_stopping_triggered:
            logger.info("Evolution stopped due to early stopping - saving final checkpoint")
            # Continue to save final checkpoint for early stopping

        # Save final checkpoint if needed
        # Note: start_iteration here is the evolution start (1 for fresh start, not 0)
        # max_iterations is the number of evolution iterations to run
        final_iteration = start_iteration + max_iterations - 1
        if final_iteration > 0 and final_iteration % self.config.checkpoint_interval == 0:
            self._save_checkpoint(final_iteration)

    def _save_best_program(self, program: Optional[Program] = None) -> Optional[Dict[str, str]]:
        """
        Save the best program

        Args:
            program: Best program (if None, uses the tracked best program)
        """
        # If no program is provided, use the tracked best program from the database
        if program is None:
            if self.database.best_program_id:
                program = self.database.get(self.database.best_program_id)
            else:
                # Fallback to calculating best program if no tracked best program
                program = self.database.get_best_program()

        if not program:
            logger.warning("No best program found to save")
            return None

        best_dir = os.path.join(self.output_dir, "best")
        os.makedirs(best_dir, exist_ok=True)

        # Use the extension from the initial program file
        filename = f"best_program{self.file_extension}"
        code_path = os.path.join(best_dir, filename)

        with open(code_path, "w") as f:
            f.write(program.code)

        # Save complete program info including metrics
        info_path = os.path.join(best_dir, "best_program_info.json")
        with open(info_path, "w") as f:
            json.dump(
                {
                    "id": program.id,
                    "generation": program.generation,
                    "iteration": program.iteration_found,
                    "timestamp": program.timestamp,
                    "parent_id": program.parent_id,
                    "metrics": program.metrics,
                    "language": program.language,
                    "saved_at": time.time(),
                },
                f,
                indent=2,
            )

        logger.info(f"Saved best program to {code_path} with program info to {info_path}")
        return {"code_path": code_path, "info_path": info_path}
