from typing import Optional, Tuple, List
import logging
from pathlib import Path
from shinka.database import Program
from shinka.llm import LLMClient
from shinka.prompts import NOVELTY_SYSTEM_MSG, NOVELTY_USER_MSG

logger = logging.getLogger(__name__)


class NoveltyJudge:
    

    def __init__(
        self,
        novelty_llm_client: Optional[LLMClient] = None,
        language: str = "python",
        similarity_threshold: float = 1.0,
        max_novelty_attempts: int = 3,
    ):
        self.novelty_llm_client = novelty_llm_client
        self.language = language
        self.similarity_threshold = similarity_threshold
        self.max_novelty_attempts = max_novelty_attempts

    def should_check_novelty(
        self,
        code_embedding: List[float],
        generation: int,
        parent_program: Optional[Program],
        database,
    ) -> bool:
        
        if not code_embedding or generation == 0 or not parent_program:
            return False

        
        if (
            parent_program.island_idx is not None
            and hasattr(database, "island_manager")
            and database.island_manager is not None
            and hasattr(database.island_manager, "are_all_islands_initialized")
            and database.island_manager.are_all_islands_initialized()
        ):
            return True

        return False

    def assess_novelty_with_rejection_sampling(
        self,
        exec_fname: str,
        code_embedding: List[float],
        parent_program: Program,
        database,
    ) -> Tuple[bool, dict]:
        
        novelty_metadata = {
            "novelty_checks_performed": 0,
            "novelty_total_cost": 0.0,
            "novelty_explanation": "",
            "max_similarity": 0.0,
            "similarity_scores": [],
        }

        for attempt in range(self.max_novelty_attempts):
            
            similarity_scores = database.compute_similarity(
                code_embedding, parent_program.island_idx
            )

            if not similarity_scores:
                logger.info(
                    f"NOVELTY CHECK {attempt + 1}/{self.max_novelty_attempts}: "
                    "Accepting program due to no similarity scores."
                )
                novelty_metadata["similarity_scores"] = []
                return True, novelty_metadata

            max_similarity = max(similarity_scores)
            sorted_similarity_scores = sorted(similarity_scores, reverse=True)
            formatted_similarities = [f"{s:.2f}" for s in sorted_similarity_scores]

            logger.info(f"Top-5 similarity scores: {formatted_similarities[:5]}")

            novelty_metadata["max_similarity"] = max_similarity
            novelty_metadata["similarity_scores"] = similarity_scores

            if max_similarity <= self.similarity_threshold:
                logger.info(
                    f"NOVELTY CHECK {attempt + 1}/{self.max_novelty_attempts}: "
                    f"Accepting program due to low similarity "
                    f"({max_similarity:.3f} <= {self.similarity_threshold})"
                )
                return True, novelty_metadata

            
            should_reject = True
            novelty_cost = 0.0

            if self.novelty_llm_client is not None:
                
                most_similar_program = database.get_most_similar_program(
                    code_embedding, parent_program.island_idx
                )

                if most_similar_program:
                    try:
                        
                        proposed_code = Path(exec_fname).read_text(encoding="utf-8")
                        is_novel, explanation, cost = self.check_llm_novelty(
                            proposed_code, most_similar_program
                        )
                        should_reject = not is_novel
                        novelty_cost = cost
                        novelty_metadata["novelty_checks_performed"] += 1
                        novelty_metadata["novelty_total_cost"] += cost
                        novelty_metadata["novelty_explanation"] = explanation
                    except Exception as e:
                        logger.warning(f"Error reading code for novelty check: {e}")
                        should_reject = True  

            if should_reject:
                logger.info(
                    f"NOVELTY CHECK {attempt + 1}/{self.max_novelty_attempts}: "
                    f"Rejecting program due to high similarity "
                    f"({max_similarity:.3f} > {self.similarity_threshold})"
                    + (
                        f" and LLM novelty check (cost: {novelty_cost:.4f})"
                        if novelty_cost > 0
                        else ""
                    )
                    + ". Retrying with different parent/inspirations."
                )
                
                continue
            else:
                logger.info(
                    f"NOVELTY CHECK {attempt + 1}/{self.max_novelty_attempts}: "
                    f"Accepting program despite high similarity "
                    f"({max_similarity:.3f} > {self.similarity_threshold}) "
                    f"due to LLM novelty check (cost: {novelty_cost:.4f})."
                )
                return True, novelty_metadata

        
        logger.info(
            f"NOVELTY CHECK: Exhausted all {self.max_novelty_attempts} attempts, "
            "rejecting program."
        )
        return False, novelty_metadata

    def check_llm_novelty(
        self, proposed_code: str, most_similar_program: Program
    ) -> Tuple[bool, str, float]:
        
        if not self.novelty_llm_client:
            logger.debug("Novelty LLM not configured, skipping novelty check")
            return True, "No novelty LLM configured", 0.0

        user_msg = NOVELTY_USER_MSG.format(
            language=self.language,
            existing_code=most_similar_program.code,
            proposed_code=proposed_code,
        )

        try:
            response = self.novelty_llm_client.query(
                msg=user_msg,
                system_msg=NOVELTY_SYSTEM_MSG,
                llm_kwargs=self.novelty_llm_client.get_kwargs(),
            )

            if response is None or response.content is None:
                logger.warning("Novelty LLM returned empty response")
                return True, "LLM response was empty", 0.0

            content = response.content.strip()
            api_cost = response.cost or 0.0

            
            is_novel = content.upper().startswith(
                "NOVEL"
            ) or content.upper().startswith("**NOVEL**")
            explanation = content
            return is_novel, explanation, api_cost

        except Exception as e:
            logger.error(f"Error in novelty LLM check: {e}")
            return True, f"Error in novelty check: {e}", 0.0

    def log_novelty_skip_message(self, reason: str) -> None:
        
        logger.info(f"NOVELTY CHECK: Skipping rejection sampling - {reason}")
