from collections import Counter
from logging import getLogger
from typing import Dict, List, Union

import numpy as np
import scipy.stats

log = getLogger(__name__)


def analyze_random_strings(
    strings: List[str],
) -> Dict[str, Union[int, float, Dict[str, int], str, None]]:
    """Performs basic analysis and randomness checks on the collected random strings."""
    # Re-included here for completeness, or could be moved to a shared utility module.
    analysis: Dict[str, Union[int, float, Dict[str, int], str, None]] = {}
    total_strings = len(strings)
    analysis["total_strings_collected"] = total_strings

    if total_strings == 0:
        analysis["unique_strings_count"] = 0
        analysis["average_length"] = 0.0
        analysis["min_length"] = 0
        analysis["max_length"] = 0
        analysis["char_frequency"] = {}
        analysis["shannon_entropy_chars"] = None
        analysis["average_run_length"] = None
        analysis["most_common_bigram"] = None
        analysis["most_common_bigram_freq"] = None
        return analysis

    unique_strings = set(strings)
    analysis["unique_strings_count"] = len(unique_strings)

    lengths = [len(s) for s in strings]
    analysis["average_length"] = (
        sum(lengths) / total_strings if total_strings > 0 else 0.0
    )
    analysis["min_length"] = min(lengths) if lengths else 0
    analysis["max_length"] = max(lengths) if lengths else 0

    all_chars = "".join(strings)
    total_chars = len(all_chars)

    char_counts = Counter(all_chars)
    analysis["char_frequency"] = dict(char_counts)
    if total_chars > 0:
        probabilities = [count / total_chars for count in char_counts.values()]
        try:
            entropy = scipy.stats.entropy(probabilities, base=2)
            analysis["shannon_entropy_chars"] = entropy
        except ImportError:
            log.warning("scipy.stats not found. Cannot calculate Shannon entropy.")
            analysis["shannon_entropy_chars"] = "Error: scipy not found"
        except Exception as e:
            log.warning(f"Could not calculate Shannon entropy: {e}")
            analysis["shannon_entropy_chars"] = f"Error: {e}"
    else:
        analysis["shannon_entropy_chars"] = None

    if total_chars > 0:
        runs = 0
        run_lengths_sum = 0
        if total_chars > 0:
            runs = 1
            current_run_length = 0
            for i in range(total_chars):
                current_run_length += 1
                if i + 1 == total_chars or all_chars[i] != all_chars[i + 1]:
                    run_lengths_sum += current_run_length
                    if i + 1 < total_chars:
                        runs += 1
                    current_run_length = 0
        analysis["average_run_length"] = run_lengths_sum / runs if runs > 0 else 0
    else:
        analysis["average_run_length"] = None

    if total_chars >= 2:
        bigrams = [all_chars[i : i + 2] for i in range(total_chars - 1)]
        if bigrams:
            bigram_counts = Counter(bigrams)
            if bigram_counts:
                most_common_bigram, count = bigram_counts.most_common(1)[0]
                analysis["most_common_bigram"] = most_common_bigram
                analysis["most_common_bigram_freq"] = count / len(bigrams)
            else:
                analysis["most_common_bigram"] = None
                analysis["most_common_bigram_freq"] = None
        else:
            analysis["most_common_bigram"] = None
            analysis["most_common_bigram_freq"] = None
    else:
        analysis["most_common_bigram"] = None
        analysis["most_common_bigram_freq"] = None

    return analysis


def analyze_random_integers(
    integers: List[int], min_value: int, max_value: int
) -> Dict[str, Union[int, float, Dict[int, int], str, None]]:  # Reverted type hint
    """Analyzes the distribution of the generated random integers."""
    analysis: Dict[
        str, Union[int, float, Dict[int, int], str, None]
    ] = {}  # Reverted type hint
    total_integers = len(integers)
    analysis["total_integers_parsed"] = total_integers

    if total_integers == 0:
        analysis["observed_integer_counts"] = {}
        analysis["min_generated_int"] = None
        analysis["max_generated_int"] = None
        analysis["mean_generated_int"] = None
        analysis["std_dev_generated_int"] = None
        analysis["chi_squared_uniformity"] = None
        analysis["p_value_uniformity"] = None
        return analysis

    observed_counts = Counter(integers)
    analysis["observed_integer_counts"] = dict(observed_counts)

    analysis["min_generated_int"] = min(integers)
    analysis["max_generated_int"] = max(integers)
    analysis["mean_generated_int"] = np.mean(integers)
    analysis["std_dev_generated_int"] = np.std(integers)
    return analysis
