import json
import os
from openai import OpenAI
from tqdm import tqdm

os.environ["OPENAI_API_KEY"] = "YOUR_API_KEY"
client = OpenAI(api_key=os.environ.get("OPENAI_API_KEY")) # Initialize the OpenAI client

# Define a function to run inference on the model
def run_inference(model, response):
    prompt = f"I am providing you a response from a model to a physics problem, termed 'Model Response'. You should extract the answer from the response. Directly output the extracted answer with no explanation. \n\nModel Response:{response}\n"
    # Run the model on the prompt
    response = client.chat.completions.create(
        model=model,
        messages=[
            {"role": "system", "content": "You are a expert assistant for extract final answer from a solution of problem."},
            {"role": "user", "content": prompt}
        ]
    )
    # Extract the response from the
    response = response.choices[0].message.content.strip()
    return response

# Load the JSON file containing the questions and input
with open('', 'r') as file:
    data = json.load(file)

save_results = []
# Iterate through each response in the JSON file
for idx, item in enumerate(tqdm(data, desc="Evaluating responses")):
    response = item['response']

    # Evaluate the model's response
    response = run_inference("gpt-4", response)
    print(response)

    # Save the evaluation result
    item['extracted_answer'] = response
    save_results.append(item)

    # Save the results every 10 responses
    if (idx+1) % 10 == 0:
        # Read existing results from the file, if it exists
        existing_results = []
        with open('', 'r') as file:
            existing_results = json.load(file)
        # Append the new results to the existing results
        for i in save_results:
            existing_results.append(i)
        # Save the results to the file
        with open('', 'w') as file:
            json.dump(existing_results, file, indent=4)
        save_results = []




