import json, os, string
import subprocess

input_dir = "outputs_math_2class_cotmuchmore"
# input_single_f = "../ft_data/gpt4o/test/data_lvl_54321_greedy_4class.json"
input_single_f = "rationales_nl_1.jsonl"
input_f = os.path.join(input_dir, input_single_f)


def preprocess(input_f):
    with open(input_f, "r", encoding="utf-8") as f:
        try:
            data = json.load(f)
        except:
            data = ""
            pass
    dict_mapping = {
        # "cot": "Chain-of-Thought",
        # "PAL": "Program-aided language",
        # "NLCode": "Natural language "
    }
    # Ensure it's a list of dictionaries
    if isinstance(data, list):
        print(len(data))
        cot = 0
        pal = 0
        for entry in data:
            print(entry['label'])
            if "COT".lower() in entry['label']:
                cot += 1
            elif "PAL".lower() in entry['label']:
                pal += 1

        print(cot)
        print(pal)
    else:
        with open(input_f, "r", encoding="utf-8") as f:
            total = 0
            cot = 0
            pal = 0
            for e in f:
                entry = json.loads(e)
                total += 1
                # print(entry

                print(entry['messages'][0]['content'])
                method = entry['messages'][0]['content'].split("<Answer>\nSelected method:")[-1]
                # print(method)
                if "COT" in method:
                    cot += 1
                elif "PAL" in method:
                    pal += 1
        print(total)
        print(cot)
        print(pal)


preprocess(input_f)

