from nltk.corpus import stopwords
from nltk.cluster.util import cosine_distance
import numpy as np

def program_judge_20(query: str, response: str) -> dict:
    """
    Judges responses based on their relevance to the query, using cosine similarity 
    to measure semantic similarity.
    """
    try:
        # Convert to lower case and remove stopwords
        stop_words = set(stopwords.words('english'))
        query = [word.lower() for word in query.split() if word not in stop_words]
        response = [word.lower() for word in response.split() if word not in stop_words]

        # Create a vector representation of sentences
        all_words = list(set(query + response))
        query_vector = [0] * len(all_words)
        response_vector = [0] * len(all_words)

        # Build the vector for the first sentence
        for word in query:
            query_vector[all_words.index(word)] += 1

        # Build the vector for the second sentence
        for word in response:
            response_vector[all_words.index(word)] += 1

        # Compute cosine similarity
        cosine_similarity = 1 - cosine_distance(query_vector, response_vector)

        # Scale the similarity score to 0-10
        score = cosine_similarity * 10
        reasoning = "The score is based on the cosine similarity between the query and the response."
        criteria = "Relevance to Query (Semantic Similarity)"

        return {
            'score': score,
            'reasoning': reasoning,
            'criteria': criteria
        }
    except Exception as e:
        return {
            'score': 0.0,
            'reasoning': f"Error in evaluation: {str(e)}",
            'criteria': "Error occurred"
        }