"""
Common English words for the n vs KL/JS experiment.
Uses Google's 10,000 most common English words (no swears).
"""

import random
from fractions import Fraction
from pathlib import Path


def load_google_words():
    """Load words from the Google 10,000 English words file."""
    current_dir = Path(__file__).parent
    words_file = current_dir / "google-10000-english-no-swears.txt"

    with open(words_file, "r", encoding="utf-8") as f:
        words = [line.strip() for line in f if line.strip()]

    return words


# Load the words once when the module is imported
COMMON_WORDS = load_google_words()


def get_words_for_n(n: int) -> list[str]:
    """Get the first n words from the common words list."""
    if n > len(COMMON_WORDS):
        raise ValueError(f"Requested {n} words but only {len(COMMON_WORDS)} available")
    random.shuffle(COMMON_WORDS)
    return COMMON_WORDS[:n]


def get_uniform_probabilities(n: int) -> list[str]:
    """Get uniform probabilities for n words as strings to avoid floating point errors."""
    # Use Fraction to get exact representation, then convert to string
    prob_fraction = Fraction(1, n)
    prob_str = str(prob_fraction)
    return [prob_str] * n
