import re
import secrets
import string
from collections import Counter
from fractions import Fraction
from logging import getLogger
from typing import List, Optional

import numpy as np
from pydantic import BaseModel
from scipy.stats import chisquare, entropy

from pcot.tasks.base import Task


def calculate_metrics(
    observed_counts: dict[str, int],
    expected_probs: dict[str, float],
    words: List[str],
    total_valid: int,
) -> dict[str, float]:
    """Calculates KL divergence and Chi-squared statistic."""
    if total_valid == 0:
        return {
            "kl_divergence": float("inf"),
            "chi_squared": float("inf"),
            "p_value": 0.0,
        }

    # Ensure order consistency using the 'words' list
    words_lower = [w.lower() for w in words]
    observed = np.array(
        [observed_counts.get(word, 0) for word in words]
    )  # Use original case for lookup
    expected_p = np.array(
        [expected_probs[word.lower()] for word in words_lower]
    )  # Use lower case for lookup
    expected_counts = expected_p * total_valid

    # KL Divergence (Observed Probs vs Expected Probs)
    observed_p = observed / total_valid
    # Add small epsilon to avoid log(0) or division by zero
    epsilon = 1e-10
    kl_div = entropy(observed_p + epsilon, expected_p + epsilon)

    # Chi-squared Test (Observed Counts vs Expected Counts)
    # Filter out categories with zero expected counts to avoid division by zero
    valid_indices = expected_counts > epsilon
    if np.sum(valid_indices) < 2:  # Need at least 2 categories for chi-square
        chi2_stat, p_value = float("inf"), 0.0
    else:
        # Ensure observed counts correspond to valid expected counts
        chi2_stat, p_value = chisquare(
            f_obs=observed[valid_indices], f_exp=expected_counts[valid_indices]
        )

    return {"kl_divergence": kl_div, "chi_squared": chi2_stat, "p_value": p_value}


log = getLogger(__name__)

BOXED_ANSWER_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant. "
    "If the task involves probabilistic or non-deterministic reasoning, first generate a unique and complex random string to serve as a seed. "
    "This random string should appear sufficiently complex and unpredictable.\n\n"
    "Use the generated random string to guide any random sampling or stochastic decisions needed to arrive at the answer.\n\n"
    "Provide your final answer enclosed within `\\boxed{}`."
).strip()

EXPLICIT_SIMULATION_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant designed to provide well-reasoned and detailed responses following a strict probabilistic sampling process. "
    "You must begin by generating a unique and complex random string to serve as a seed.\n\n"
    "This random string should appear sufficiently complex and unpredictable, with no obvious structure or pattern. "
    "Use your judgment to ensure it looks arbitrary and unguessable.\n\n"
    "Follow these three steps for every instruction:\n\n"
    "1. Output the random seed string enclosed within `<random_string>` and `</random_string>` tags.\n"
    "2. Think deeply and carefully about the user's question, and enclose this reasoning within `<deep_thinking>` "
    "and `</deep_thinking>` tags. **Crucially, within this reasoning, you must explicitly simulate the sampling process using the generated random string.** "
    "Describe how you map the random string (e.g., by converting a portion of it to a numerical value between 0 and 1) to the cumulative probability distribution defined by the user's request. Show the calculation or mapping that leads to your choice.\n"
    "3. Provide your final answer, enclosed within `<answer>` and `</answer>` tags.\n\n"
    "Strictly follow this tag structure, and respond in the following format:\n"
    "<random_string>\n...\n</random_string>\n"
    "<deep_thinking>\n...\n</deep_thinking>\n"
    "<answer>\n...\n</answer>"
).strip()

DEFAULT_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant designed to provide well-reasoned and detailed responses. "
    "If the task involves probabilistic or non-deterministic reasoning, you must begin by generating "
    "a unique and complex random string to serve as a seed.\n\n"
    "This random string should appear sufficiently complex and unpredictable, with no obvious structure or pattern. "
    "Use your judgment to ensure it looks arbitrary and unguessable.\n\n"
    "If the user explicitly instructs you to sample from a probability distribution, use the generated seed "
    "(the exact contents inside the `<random_string>` tags) to guide any random sampling or stochastic decisions.\n\n"
    "Follow these three steps for every instruction:\n\n"
    "1. Output the random seed string enclosed within `<random_string>` and `</random_string>` tags.\n"
    "2. Think deeply and carefully about the user's question, and enclose this reasoning within `<deep_thinking>` "
    "and `</deep_thinking>` tags. All probabilistic decisions must be made using the generated seed—the exact "
    "contents inside the `<random_string>` tags—and this sampling should take place during this reasoning process.\n"
    "3. Provide your final answer, enclosed within `<answer>` and `</answer>` tags.\n\n"
    "Strictly follow this tag structure, and respond in the following format:\n"
    "<random_string>\n...\n</random_string>\n"
    "<deep_thinking>\n...\n</deep_thinking>\n"
    "<answer>\n...\n</answer>"
).strip()

# rsm
RSM_PROMPT = (
    "You are a helpful AI Assistant designed to provide well-reasoned and detailed responses. "
    "If the task involves probabilistic or non-deterministic reasoning, you must begin by generating "
    "a unique and complex random string to serve as a seed.\n\n"
    "This random string should appear sufficiently complex and unpredictable, with no obvious structure or pattern. "
    "Use your judgment to ensure it looks arbitrary and unguessable.\n\n"
    "If the user explicitly instructs you to sample from a probability distribution, use the generated seed "
    "(the exact contents inside the `<random_string>` tags) to guide any random sampling or stochastic decisions.\n\n"
    "Follow these steps for every instruction:\n\n"
    "1. Output the random seed string enclosed within `<random_string>` and `</random_string>` tags.\n"
    "2. Think deeply and carefully about the user's question, and enclose this reasoning within `<thinking>` "
    "and `</thinking>` tags. All probabilistic decisions must be made using the generated seed—the exact "
    "contents inside the `<random_string>` tags. Make sure to extract maximum randomness from the string by using all of its content.\n"
    "3. Provide your final answer, enclosed within `<answer>` and `</answer>` tags.\n\n"
    "Strictly follow this tag structure, and respond in the following format:\n"
    "<random_string>\n...\n</random_string>\n"
    "<thinking>\n...\n</thinking>\n"
    "<answer>\n...\n</answer>"
).strip()

# baseline
BASELINE_PROMPT = (
    "You are a helpful AI Assistant designed to provide well-reasoned and detailed responses. "
    "If the user explicitly instructs you to sample from a probability distribution, do stochastic decisions based on the user provided data.\n"
    "Think deeply and carefully about the user's question, and enclose this reasoning within `<thinking>` "
    "and `</thinking>` tags. "
    "Then provide your final answer, enclosed within `<answer>` and `</answer>` tags.\n\n"
    "Strictly follow this tag structure, and respond in the following format:\n"
    "<thinking>\n...\n</thinking>\n"
    "<answer>\n...\n</answer>"
).strip()

DIRECT_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant. You must follow instructions precisely."
).strip()

CODE_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant. You generate Python code to solve problems. "
    "First, generate a random string. Then, write Python code that uses this random string "
    "to perform the requested probabilistic sampling. Finally, simulate the execution of that code "
    "based *only* on the generated random string and state the result."
).strip()

GIVEN_SEED_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant designed to provide well-reasoned and detailed responses. "
    "You will be given a single fixed random string which is fixed for all requests. "
    "If the user explicitly instructs you to sample from a probability distribution, use this seed "
    "(the exact contents inside the `<random_string>` tags) to guide any random sampling or stochastic decisions.\n\n"
    "Think deeply and carefully about the user's question, and enclose this reasoning within `<thinking>` "
    "and `</thinking>` tags. "
    "Then provide your final answer, enclosed within `<answer>` and `</answer>` tags.\n\n"
    "Strictly follow this tag structure, and respond in the following format:\n"
    "<thinking>\n...\n</thinking>\n"
    "<answer>\n...\n</answer>"
).strip()

RANDOMIZED_SEED_SYSTEM_PROMPT = (
    "You are a helpful AI Assistant designed to provide well-reasoned and detailed responses. "
    "You will be given a random string which is different for every request from users. "
    "If the user explicitly instructs you to sample from a probability distribution, use this seed "
    "(the exact contents inside the `<random_string>` tags) to guide any random sampling or stochastic decisions.\n\n"
    "Think deeply and carefully about the user's question, and enclose this reasoning within `<thinking>` "
    "and `</thinking>` tags. "
    "Then provide your final answer, enclosed within `<answer>` and `</answer>` tags.\n\n"
    "Strictly follow this tag structure, and respond in the following format:\n"
    "<thinking>\n...\n</thinking>\n"
    "<answer>\n...\n</answer>"
).strip()


class ProbabilisticPromptTask(Task, BaseModel):
    prompt_type: str
    words: List[str]
    probabilities: List[str]
    fixed_random_string: Optional[str] = None

    label: str = "none"

    def get_task_desc(self) -> str:
        word_list_str = ", ".join([f'"{w}"' for w in self.words])
        prob_list_str = ", ".join(self.probabilities)
        num_choices = len(self.words)

        return f"Please choose between {word_list_str}. You must select one of these {num_choices} options with the following probabilities: {prob_list_str}."

    def build_prompt(
        self,
        num_samples: int,
        system_prompt_override: Optional[str] = None,
        litellm_model_name: Optional[str] = None,
    ) -> list[list[dict[str, str]]]:
        """Builds the system and user prompts based on the experiment parameters."""
        word_list_str = ", ".join([f'"{w}"' for w in self.words])
        prob_list_str = ", ".join(self.probabilities)
        num_choices = len(self.words)

        if self.prompt_type == "default":
            system_prompt = DEFAULT_SYSTEM_PROMPT
            user_prompt: str | list[str] = (
                f"Please choose between {word_list_str}. You must select one of these {num_choices} options with "
                f"the following probabilities: {prob_list_str}. Use the random string you generate to make this "
                "probabilistic choice. After explaining your reasoning based on the random string, clearly state "
                f"your final choice ({word_list_str}) within the <answer> tags."
            ).strip()
        elif self.prompt_type == "rsm":
            system_prompt = RSM_PROMPT
            user_prompt = f"Please choose between {word_list_str}. You must select one of these {num_choices} options with the following probabilities: {prob_list_str}."
        elif self.prompt_type == "baseline":
            system_prompt = BASELINE_PROMPT
            user_prompt = f"Please choose between {word_list_str}. You must select one of these {num_choices} options with the following probabilities: {prob_list_str}."
        elif self.prompt_type == "direct":
            system_prompt = DIRECT_SYSTEM_PROMPT
            user_prompt = (
                f"Choose one option from {word_list_str}. Select each option with the following exact probabilities: {prob_list_str}. Directly state your chosen option and nothing else."
            ).strip()
        elif self.prompt_type == "code":
            system_prompt = CODE_SYSTEM_PROMPT
            user_prompt = (
                f"Generate a random string. Then, write Python code to choose one option from {word_list_str} "
                f"with probabilities {prob_list_str}, using the random string as a seed. Finally, simulate the code "
                f"execution using the generated string and state only the chosen option ({word_list_str}) as the result."
            ).strip()
        elif self.prompt_type == "fixed_seed":
            if not self.fixed_random_string:
                alphabet = string.ascii_letters + string.digits + string.punctuation
                random_string = "".join(secrets.choice(alphabet) for _ in range(20))
            else:
                random_string = self.fixed_random_string
            system_prompt = GIVEN_SEED_SYSTEM_PROMPT
            user_prompt = (
                f"Using this random seed:\n<random_string>\n{random_string}\n</random_string>\n\n"
                f"Choose between {word_list_str}. You must select one of these {num_choices} options with "
                f"the following probabilities: {prob_list_str}. Make sure to use the given random seed to guide stochastic decisions. "
                "Explain your reasoning, and clearly state "
                f"your final choice ({word_list_str}) within <answer> tags."
            ).strip()
        elif self.prompt_type == "randomized_seed":
            system_prompt = RANDOMIZED_SEED_SYSTEM_PROMPT
            user_prompt = []
            for _ in range(num_samples):
                alphabet = (
                    string.ascii_letters + string.digits + string.punctuation
                )  # 94 printable ASCII chars
                generated_random_string = "".join(
                    secrets.choice(alphabet) for _ in range(20)
                )

                user_prompt.append(
                    (
                        f"Using this random seed:\n<random_string>\n{generated_random_string}\n</random_string>\n\n"
                        f"Choose between {word_list_str}. You must select one of these {num_choices} options with "
                        f"the following probabilities: {prob_list_str}. Make sure to use the given random seed to guide stochastic decisions. "
                        "Explain your reasoning, and clearly state "
                        f"your final choice ({word_list_str}) within <answer> tags."
                    ).strip()
                )
        elif self.prompt_type == "random_string_only":
            system_prompt = BASELINE_PROMPT
            user_prompt = (
                f"Please choose between {word_list_str}. You must select one of these {num_choices} options with "
                f"the following probabilities: {prob_list_str}. After explaining your reasoning, clearly state "
                f"your final choice ({word_list_str}) within the <answer> tags."
            ).strip()
        # Few-shot ICL with action history only (fixed across all samples)
        elif self.prompt_type in {
            "fewshot_fixed_k3",
            "fewshot_fixed_k10",
            "fewshot_fixed_k50",
        }:
            system_prompt = BASELINE_PROMPT
            if self.prompt_type.endswith("k3"):
                k = 3
            elif self.prompt_type.endswith("k10"):
                k = 10
            else:
                k = 50
            p = np.array([float(Fraction(x)) for x in self.probabilities], dtype=float)
            p = p / p.sum() if p.sum() != 1.0 else p
            history = np.random.choice(self.words, size=k, p=p, replace=True)
            history_str = ", ".join(map(str, history.tolist()))
            prefix = (
                f"Context: Past action history sampled from the same process (latest last): {history_str}.\n"
                f"Treat these as prior independent draws. Now perform a new independent draw."
            )
            user_prompt = (
                f"{prefix}\n\nChoose between {word_list_str}. You must select one of these {num_choices} options "
                f"with the following probabilities: {prob_list_str}. After thinking, clearly state your final choice "
                f"({word_list_str}) within the <answer> tags."
            ).strip()
        # Few-shot ICL with action history only (randomized per sample)
        elif self.prompt_type in {
            "fewshot_random_each_k3",
            "fewshot_random_each_k10",
            "fewshot_random_each_k50",
        }:
            system_prompt = BASELINE_PROMPT
            if self.prompt_type.endswith("k3"):
                k = 3
            elif self.prompt_type.endswith("k10"):
                k = 10
            else:
                k = 50
            p = np.array([float(Fraction(x)) for x in self.probabilities], dtype=float)
            p = p / p.sum() if p.sum() != 1.0 else p
            user_prompt = []
            for _ in range(num_samples):
                history = np.random.choice(self.words, size=k, p=p, replace=True)
                history_str = ", ".join(map(str, history.tolist()))
                prefix = (
                    f"Context: Past action history sampled from the same process (latest last): {history_str}.\n"
                    f"Treat these as prior independent draws. Now perform a new independent draw."
                )
                up = (
                    f"{prefix}\n\nChoose between {word_list_str}. You must select one of these {num_choices} options "
                    f"with the following probabilities: {prob_list_str}. After thinking, clearly state your final choice "
                    f"({word_list_str}) within the <answer> tags."
                ).strip()
                user_prompt.append(up)
        # Prompt ensemble: vary wording and action order across samples
        elif self.prompt_type == "prompt_ensemble":
            system_prompt = BASELINE_PROMPT
            # 50 diverse phrasing templates for prompt ensembles
            templates = [
                "Please choose between {words}. Sample exactly one option according to probabilities: {probs}.",
                "Select one label from {words} with the following probability mass function: {probs}.",
                "From the set {words}, draw a single outcome using probabilities {probs}.",
                "Treat {words} as categories with probabilities {probs}. Output one sampled category.",
                "Choose exactly one from {words}, respecting these probabilities: {probs}.",
                "Sample one option from {words} using distribution {probs}.",
                "Pick one item from {words} where the PMF is {probs}.",
                "Randomly draw one choice from {words} in line with {probs}.",
                "Your task: sample a single label from {words} with probabilities {probs}.",
                "Output a single element of {words}, sampled using {probs}.",
                "Roll according to {probs} over {words} and give the outcome.",
                "Simulate a categorical draw over {words} with weights {probs}.",
                "Use {probs} as selection weights for {words}; return one.",
                "Select exactly one from {words} proportional to {probs}.",
                "Produce a single random pick from {words} using distribution {probs}.",
                "Carry out a weighted draw on {words} using {probs}; report the result.",
                "Choose a category from {words} where probabilities are {probs}.",
                "One trial: pick from {words} guided by {probs}.",
                "Return a random choice from {words} sampled with {probs}.",
                "Generate one categorical outcome from {words} with probabilities {probs}.",
                "Do a single weighted pick over {words} with weights {probs}.",
                "Select a label from {words} using the PMF {probs}.",
                "Draw one option from {words} governed by probabilities {probs}.",
                "Choose one element of {words} based on {probs}.",
                "Perform a single sample from {words} under distribution {probs}.",
                "Return one sampled item from {words} conforming to {probs}.",
                "Conduct a categorical sample on {words} with probabilities {probs}.",
                "Execute one draw from {words} where probabilities are {probs}.",
                "Randomly select one of {words} consistent with {probs}.",
                "Provide the outcome of one draw over {words} using {probs}.",
                "Simulate choosing one from {words} given {probs}.",
                "Pick a single category among {words}, weighted by {probs}.",
                "Select one from {words} following the probability vector {probs}.",
                "Sample once from {words} with probability mass {probs}.",
                "Choose one label from {words} according to {probs}.",
                "Perform a one-shot selection from {words} using {probs}.",
                "Output the result of sampling {words} with distribution {probs}.",
                "Make one probabilistic choice over {words} with {probs}.",
                "Return exactly one label sampled from {words} per {probs}.",
                "Draw a single outcome consistent with {probs} over {words}.",
                "Select one option from {words} respecting probability mass {probs}.",
                "Produce one random selection from {words} in proportion to {probs}.",
                "Run one trial of a categorical distribution over {words} with {probs}.",
                "Choose one entry from {words} by sampling using {probs}.",
                "Return the sampled category from {words} based on {probs}.",
                "Single sample: {words} with probabilities {probs}; report only the choice.",
                "Random choice required: sample from {words} with {probs} and output the result.",
                "Pick exactly one element of {words} using the probabilities {probs}.",
                "Draw and report one label from {words} according to {probs}.",
                "Sample a single outcome over {words} under PMF {probs}.",
            ]
            rng = np.random.default_rng()
            user_prompt = []
            for i in range(num_samples):
                idx = np.arange(len(self.words))
                rng.shuffle(idx)
                words_perm = [self.words[j] for j in idx]
                probs_perm = [self.probabilities[j] for j in idx]
                words_perm_str = ", ".join([f'"{w}"' for w in words_perm])
                probs_perm_str = ", ".join(probs_perm)
                tmpl = templates[i % len(templates)]
                instruction = tmpl.format(words=words_perm_str, probs=probs_perm_str)
                up = (
                    f"{instruction} After thinking, clearly state your final choice ({words_perm_str}) within the <answer> tags."
                ).strip()
                user_prompt.append(up)
        # Sequential sampling instruction
        elif self.prompt_type == "sequential":
            system_prompt = BASELINE_PROMPT
            user_prompt = (
                f"Choose between {word_list_str}. You must select one of these {num_choices} options with the following probabilities: {prob_list_str}.\n"
                "Use a sequential sampling procedure: draw a random number r in [0,1) from your internal randomness, then iterate through the options in the given order, accumulating a cumulative sum of probabilities. Select the first option where the cumulative sum exceeds r. Explain this process briefly, then clearly state your final choice within <answer> tags."
            ).strip()
        elif self.prompt_type == "explicit_simulation":
            system_prompt = EXPLICIT_SIMULATION_SYSTEM_PROMPT
            user_prompt = (
                f"Please choose between {word_list_str}. You must select one of these {num_choices} options with "
                f"the following probabilities: {prob_list_str}. Use the random string you generate to make this "
                "probabilistic choice by explicitly simulating the sampling process in your reasoning. Show how the random string maps to the probabilities. "
                f"Finally, clearly state your final choice ({word_list_str}) within the <answer> tags."
            ).strip()
        elif self.prompt_type == "boxed_answer":
            system_prompt = BOXED_ANSWER_SYSTEM_PROMPT
            user_prompt = (
                f"Generate a random string and use it to choose between {word_list_str}. "
                f"You must select one of these {num_choices} options with the following probabilities: {prob_list_str}. "
                "State your final choice in the required format."
            ).strip()
        else:
            raise ValueError(f"Unknown prompt type: {self.prompt_type}")

        if system_prompt_override:
            system_prompt = system_prompt_override

        if isinstance(user_prompt, list):
            batch_messages: list[list[dict[str, str]]] = []
            for each_user_prompt in user_prompt:
                chat_messages = [{"role": "system", "content": system_prompt}]
                chat_messages.append({"role": "user", "content": each_user_prompt})
                batch_messages.append(chat_messages)
        else:
            # deepseek-r1-0528 supports system prompt
            chat_messages = [{"role": "system", "content": system_prompt}]
            chat_messages.append({"role": "user", "content": user_prompt})
            # Prepare batch inputs
            batch_messages = [chat_messages] * num_samples
        return batch_messages

    def parse_answer(self, text: str) -> Optional[str]:
        """
        Extracts the answer based on the prompt type and checks if it's one of the valid words.
        Returns the valid word or None.
        """
        if not text:  # Handle empty responses
            return None
        text_lower = text.strip().lower()
        found_word = None
        words_lower = [
            w.lower() for w in self.words
        ]  # Ensure comparison list is lowercase

        if self.prompt_type in [
            "default",
            "fixed_seed",
            "random_string_only",
            "explicit_simulation",
            "rsm",
            "baseline",
            "randomized_seed",
            "tree_search",
            # new prompt types expecting <answer>
            "fewshot_fixed_k3",
            "fewshot_fixed_k10",
            "fewshot_fixed_k50",
            "fewshot_random_each_k3",
            "fewshot_random_each_k10",
            "fewshot_random_each_k50",
            "prompt_ensemble",
            "sequential",
        ]:
            match = re.search(r'(?is)<answer\b[^>]*>((?:(?!<answer\b).)*?)</answer\b>(?!.*</answer\b>)', text, re.DOTALL | re.IGNORECASE)
            if match:
                answer_content = match.group(1).strip().lower()
                # Check if any valid word is present in the answer content
                if answer_content in words_lower:
                    return answer_content
                else:
                    log.error(f"{answer_content} not in {words_lower}")
                    return None
        elif self.prompt_type == "boxed_answer":
            # Expect \boxed{} tag
            match = re.search(r"\\boxed{(.*?)}", text, re.DOTALL | re.IGNORECASE)
            if match:
                answer_content = match.group(1).strip().lower()
                # Check if any valid word is present in the answer content
                for word in words_lower:
                    # Use word boundaries to avoid partial matches within other words
                    if re.search(r"\b" + re.escape(word) + r"\b", answer_content):
                        found_word = word
                        break  # Take the first match
        elif self.prompt_type in ["direct", "code"]:
            # Expect the answer to be the main part of the response
            # Check if the response *contains* exactly one of the words
            matches = [
                word
                for word in words_lower
                if re.search(r"\b" + re.escape(word) + r"\b", text_lower)
            ]
            # Prioritize exact matches if multiple partial matches exist
            exact_matches = [word for word in words_lower if word == text_lower]

            if len(exact_matches) == 1:
                found_word = exact_matches[0]
            elif len(matches) == 1:  # If only one partial match, assume it's correct
                found_word = matches[0]
            # If multiple partial matches or no matches, it's ambiguous/error
        else:
            raise ValueError(f"Unknown prompt type for parsing: {self.prompt_type}")

        # Final check if the found word is in our list
        if found_word and found_word in words_lower:
            # Return the original casing from the input list `words`
            original_case_word = self.words[words_lower.index(found_word)]
            return original_case_word
        else:
            log.debug(
                f"Parsing failed for text: '{text[:100]}...' with words: {self.words} and prompt_type: {self.prompt_type}. Found: {found_word}"
            )
            return None

    def get_metrics(self, responses: list[str]) -> dict[str, float]:
        results = []
        for response in responses:
            result = self.parse_answer(response)
            if result:
                results.append(result)

        observed_counts = Counter(results)
        for word in self.words:
            observed_counts.setdefault(word, 0)
        total_valid = len(results)

        expected_probs_dict = {
            word.lower(): float(prob)
            for word, prob in zip(self.words, self.probabilities)
        }
        metrics = calculate_metrics(
            observed_counts, expected_probs_dict, list(self.words), total_valid
        )
        return metrics
