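# SECURITY: an API key was previously pasted on this line. Never commit credentials to source control; revoke the exposed key and supply a fresh one outside the source tree.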

# Please install OpenAI SDK first: `pip3 install openai`

import json
import os
import re
import sys

from openai import OpenAI

# Evaluation settings. The API key is deliberately NOT stored in the source;
# it is read from the environment variable named below at run time.
API_KEY_ENV_VAR = "DEEPSEEK_API_KEY"
BASE_URL = "https://api.deepseek.com"
MODEL_NAME = "deepseek-chat"
RESULT_PATH = 'result1/llama3_true.json'

# First (optionally signed) integer appearing in the judge's reply.
_INTEGER_RE = re.compile(r"-?\d+")


def iter_qa_records(result):
    """Yield ``(question, answer, target)`` for every record in *result*.

    *result* is walked as four nested mappings (the original loop variables
    named the levels file name -> person id -> model name -> record id); the
    keys themselves are not used. Each record is indexed at positions 0, 1
    and 2, and the first 2, 2 and 12 characters respectively are dropped.
    NOTE(review): the slices presumably strip fixed-width labels in front of
    the question / answer / target text -- confirm against the data producer.
    """
    for per_file in result.values():
        for per_person in per_file.values():
            for per_model in per_person.values():
                for record in per_model.values():
                    yield record[0][2:], record[1][2:], record[2][12:]


def build_prompt(question, answer, target):
    """Return the user message asking the judge model for a 0-10 score."""
    return (
        f"The known question is: {question}. "
        f"The original answer is: {answer}. "
        f"The target answer is: {target}. "
        "Please provide a score for the original answer based on the "
        "following criteria: 1-2 are irrelevant and seriously incorrect; "
        "3-4 are minor errors with low quality; 5-6 indicates medium quality; "
        "7-8 indicates a quality similar to the target answer, while 9-10 "
        "indicates that the original answer is the target answer. "
        "Please provide numbers from 0 to 10 directly and do not give any "
        "other tokens:"
    )


def parse_score(content):
    """Extract an integer score in ``[0, 10]`` from the judge's reply.

    The first integer found in *content* is used, so replies such as
    ``"Score: 8"`` or ``"8."`` are accepted in addition to a bare ``"8"``.

    Returns:
        The score, or ``None`` when *content* is empty/``None``, contains no
        integer, or the integer lies outside 0-10.
    """
    if not content:
        return None
    match = _INTEGER_RE.search(content)
    if match is None:
        return None
    value = int(match.group())
    return value if 0 <= value <= 10 else None


def main():
    """Grade every answer in ``RESULT_PATH`` and print total, count, average.

    Raises:
        SystemExit: if the API key environment variable is unset or empty.
    """
    api_key = os.environ.get(API_KEY_ENV_VAR)
    if not api_key:
        raise SystemExit(
            f"Environment variable {API_KEY_ENV_VAR} must hold the API key."
        )
    client = OpenAI(api_key=api_key, base_url=BASE_URL)

    with open(RESULT_PATH, "r", encoding="utf-8") as json_file:
        result = json.load(json_file)

    scores = 0
    ii = 0  # number of answers that received a usable score
    skipped = 0
    for question, answer, target in iter_qa_records(result):
        response = client.chat.completions.create(
            model=MODEL_NAME,
            messages=[
                {"role": "system", "content": "You are a helpful assistant"},
                {"role": "user", "content": build_prompt(question, answer, target)},
            ],
            stream=False
        )
        reply = response.choices[0].message.content
        score = parse_score(reply)
        if score is None:
            # One malformed reply must not abort the run and discard the
            # scores gathered so far; report it and leave it out of the mean.
            skipped += 1
            print(f"skipping unparseable score: {reply!r}", file=sys.stderr)
            continue
        scores += score
        ii += 1

    print(f'scores: {scores}')
    print('\n')
    print(f'ii: {ii}')
    print('\n')
    if ii:
        print(f'avg scores: {scores / ii}')
    else:
        # Avoid ZeroDivisionError when nothing could be scored.
        print('avg scores: n/a (no answers were scored)')
    if skipped:
        print(f"skipped replies: {skipped}", file=sys.stderr)


if __name__ == "__main__":
    main()