from collections import Counter
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.metrics.pairwise import cosine_similarity

def program_judge_18(query: str, response: str) -> dict:
    """
    Judges responses based on verbosity and redundancy.
    The less verbose and redundant the response, the higher the score.
    """
    try:
        # Create the CountVectorizer object
        cv = CountVectorizer()

        # Generate the matrix from the text
        count_matrix = cv.fit_transform([query, response])

        # Compute the cosine similarity
        cosine_sim = cosine_similarity(count_matrix)

        # Calculate the verbosity/redundancy score based on the cosine similarity
        verbosity_score = (1 - cosine_sim[0][1]) * 10

        # Compute the word frequency in the response
        word_counts = Counter(response.split())

        # Calculate the redundancy score based on the frequency of words
        redundancy_score = (1 - len(word_counts) / len(response.split())) * 10

        # Total score is the average of verbosity and redundancy scores
        score = (verbosity_score + redundancy_score) / 2

        reasoning = f"The response was scored based on its verbosity and redundancy. The verbosity score (based on cosine similarity with the query) was {verbosity_score:.2f}, and the redundancy score (based on word repetition) was {redundancy_score:.2f}."
        
        criteria = "Response Verbosity/Redundancy"
        
        return {
            'score': float(f"{score:.2f}"),
            'reasoning': reasoning,
            'criteria': criteria
        }
    except Exception as e:
        return {
            'score': 0.0,
            'reasoning': f"Error in evaluation: {str(e)}",
            'criteria': "Error occurred"
        }