import nltk
from collections import Counter

def program_judge_8(query: str, response: str) -> dict:
    """
    Judges responses based on its verbosity or redundancy, 
    i.e., how much information is repeated or how verbose the response is.
    """
    try:
        # Tokenize the response into words
        words = nltk.word_tokenize(response)

        # Count the frequency of each word
        word_freq = Counter(words)

        # Find the total number of words and the number of unique words
        total_words = len(words)
        unique_words = len(word_freq.keys())

        # Calculate the redundancy ratio as (total words - unique words) / total words
        redundancy_ratio = (total_words - unique_words) / total_words

        # Higher redundancy_ratio means more redundant/verbose response, so score is lower
        # Scale the score to 0-10
        score = (1 - redundancy_ratio) * 10

        reasoning = "The response was evaluated based on its verbosity or redundancy. " \
                    "Responses that have more unique words receive higher scores as they " \
                    "are considered to be less verbose and redundant."
        criteria = "Response Verbosity/Redundancy"
        
        return {
            'score': score,
            'reasoning': reasoning,
            'criteria': criteria
        }
    except Exception as e:
        return {
            'score': 0.0,
            'reasoning': f"Error in evaluation: {str(e)}",
            'criteria': "Error occurred"
        }