from typing import List
from collections import Counter
import re

def program_judge_11(query: str, response: str) -> dict:
    """
    Judges the quality of the response based on its verbosity and redundancy.
    Higher scores are given to responses which are verbose but not redundant.
    """
    try:
        # Remove punctuation and convert to lowercase
        response = re.sub(r'[^\w\s]', '', response).lower()
        words = response.split()

        # Count the frequency of each word
        word_counts = Counter(words)

        # Count the number of unique words and total words
        unique_word_count = len(word_counts)
        total_word_count = len(words)

        # Calculate verbosity - longer responses with more unique words score higher
        verbosity = unique_word_count / total_word_count

        # Calculate redundancy - responses with a high frequency of repeated words score lower
        redundancy = sum(count for word, count in word_counts.items() if count > 1) / total_word_count

        # Final score is a balance between verbosity and redundancy
        score = 10 * (verbosity - redundancy)

        # Ensure score is within 0-10 range
        score = max(0, min(score, 10))

        reasoning = f"Response has a verbosity score of {verbosity} and a redundancy score of {redundancy}."

        return {
            'score': score,
            'reasoning': reasoning,
            'criteria': "Response Verbosity/Redundancy"
        }
    except Exception as e:
        return {
            'score': 0.0,
            'reasoning': f"Error in evaluation: {str(e)}",
            'criteria': "Error occurred"
        }