
import os
import shutil
import numpy as np
import time
import json
from transformers import GenerationConfig
import os

devices = [4]
d_str = ''
for d in devices:
    d_str += str(d) + ','
d_str = d_str[:-1]
os.environ["CUDA_VISIBLE_DEVICES"] = d_str

import torch
from torch.utils.data import DataLoader
USER_PATH = '/home/XXXX/home/XXXX/6_26_backup/fs_backup_feb13/'

os.environ["CURL_CA_BUNDLE"]=""
os.environ["REQUESTS_CA_BUNDLE"]=""
# os.environ['TRANSFORMERS_CACHE'] = USER_PATH + '/.cache/huggingface/hub'
cache_dir = '/work/XXXX'
os.environ['TRANSFORMERS_CACHE'] = cache_dir
os.environ['HF_HOME'] = cache_dir
# os.environ['HF_HUB_OFFLINE'] ='1'

# import transformers

# import urllib3
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
import argparse
from tqdm import tqdm
import time
import datetime
import warnings
import contextlib

import requests
from urllib3.exceptions import InsecureRequestWarning

old_merge_environment_settings = requests.Session.merge_environment_settings

@contextlib.contextmanager
def no_ssl_verification():
    opened_adapters = set()

    def merge_environment_settings(self, url, proxies, stream, verify, cert):
        # Verification happens only once per connection so we need to close
        # all the opened adapters once we're done. Otherwise, the effects of
        # verify=False persist beyond the end of this context manager.
        opened_adapters.add(self.get_adapter(url))

        settings = old_merge_environment_settings(self, url, proxies, stream, verify, cert)
        settings['verify'] = False

        return settings

    requests.Session.merge_environment_settings = merge_environment_settings

    try:
        with warnings.catch_warnings():
            warnings.simplefilter('ignore', InsecureRequestWarning)
            yield
    finally:
        requests.Session.merge_environment_settings = old_merge_environment_settings

        for adapter in opened_adapters:
            try:
                adapter.close()
            except:
                pass

class Struct:
    def __init__(self, **entries):
        self.__dict__.update(entries)

args = {'train_file_path': './example_data', 'test_file_path': './example_data', 'save_path': './../SFT_train_res', 'model_choice': 'Qwen/Qwen2.5-VL-32B-Instruct', 
        'n_rows': 20, 'max_length': 1000,'temperature': 1, 'lr': 5e-05, 'weight_decay': 0.0, 'epochs': 10, 'max_grad_norm': 1.0, 'batch_size': 2, 'save_strategy': 'no', 'use_lora': True}
# args['model_choice'] = 'meta-llama/Meta-Llama-3-70B-Instruct'
args['model_choice'] = 'meta-llama/Meta-Llama-3-8B-Instruct'

# args['model_choice'] = 'mistralai/Mistral-7B-Instruct-v0.3'

# args['model_choice'] = "Qwen/Qwen2.5-VL-32B-Instruct"
args = Struct(**args)

class LLM():
    def __init__(self):
        quant_config = BitsAndBytesConfig(
            load_in_4bit=True,
            bnb_4bit_quant_type="nf4",
            bnb_4bit_compute_dtype="bfloat16",
            bnb_4bit_use_double_quant=True,
        )
        with no_ssl_verification():
            

            
            self.tokenizer = AutoTokenizer.from_pretrained(
                    args.model_choice,
                    cache_dir = cache_dir,
                    token = '    ',
                    # attn_implementation="flash_attention_2"

                    )
            self.tokenizer.pad_token = self.tokenizer.eos_token
            self.tokenizer.pad_token_id = self.tokenizer.eos_token_id            
            self.model = AutoModelForCausalLM.from_pretrained(
                    args.model_choice, 
                    cache_dir = cache_dir,
                    quantization_config=quant_config,
                    device_map='auto',
                    token = '    ',
                    # attn_implementation="flash_attention_2"
                    )

        self.tokenizer.pad_token = self.tokenizer.eos_token
    
    def sentence_probabilities(self, sentences):
        with torch.no_grad():
            sentence_tokens = self.tokenizer(sentences, return_tensors='pt', padding=True)
            sentence_token_ids = sentence_tokens.input_ids.cuda()

            # Little hack to cut down inference time by 4-5x (leads to some imprecisions when using quantization)
            # Find the common prefix and run it through the model once, to save time
            first_different_token = (sentence_token_ids == sentence_token_ids[0, :].unsqueeze(0)).all(dim=0).long().argmin()
            common_prefix = sentence_token_ids[0, :first_different_token].unsqueeze(0)
            common_prefix_output = self.model(common_prefix, use_cache=True)
            common_prefix_key_values = tuple(tuple(tensor.expand(len(sentences), -1, -1, -1) for tensor in layer) 
                                             for layer in common_prefix_output.past_key_values)

            # Process the rest of the sentences
            rest_outputs = self.model(sentence_token_ids[:, first_different_token:], past_key_values=common_prefix_key_values)
            logits = torch.concat([common_prefix_output.logits.expand(len(sentences), -1, -1), rest_outputs.logits], dim=1).cuda()
            log_probs = logits.log_softmax(-1)
            log_probs = log_probs[:, :-1, :].gather(2, sentence_token_ids[:, 1:][:, :, None]).squeeze(-1).cuda()
            log_probs = (log_probs*sentence_tokens.attention_mask.cuda()[:, 1:]).sum(-1).cpu()
        return log_probs
    def nli(self, sentences, unknown):
        # true_probs = self.sentence_probabilities(sentences + " True.")
        # false_probs = self.sentence_probabilities(sentences + " False.")q[]
        # maybe_probs = self.sentence_probabilities(sentences + " Maybe.")
        if unknown:
            true_probs, maybe_probs, false_probs =  (self.sentence_probabilities([sentences + "(A)", sentences + "(B)", sentences + "(C)"]))
            return {'True': true_probs, 'Maybe': maybe_probs, 'False': false_probs}
        else:
            true_probs, false_probs =  (self.sentence_probabilities([sentences + "True", sentences + "False"]).softmax(-1))
            return {'True': true_probs, 'False': false_probs}
    def yn(self, sentences, norm=True, relaxed=False, obvious=False, fewshot=None, maybe=False):
        yns = []
        for sentence in sentences:
            if fewshot:
                sentence = fewshot + sentence
            
            if relaxed:
                yns.append(sentence + "Most likely")
                yns.append(sentence + "Not necessarily")
            elif obvious:
                yns.append(sentence + "obviously true.")
                yns.append(sentence + "not obviously true.")
            elif maybe:
                yns.append(sentence + "Yes")
                yns.append(sentence + "Maybe")
                yns.append(sentence + "No")
            else:
                yns.append(sentence + "Yes")
                yns.append(sentence + "No")
        # if norm:
        #     norms = self.sentence_probabilities(sentences)
        probs = []
        batch_size = 256
        for i in range(0, len(yns), batch_size):
            if i+batch_size < len(yns):
                probs += list(self.sentence_probabilities(yns[i:i+batch_size]))
            else: 
                probs += list(self.sentence_probabilities(yns[i:]))
        probs=torch.tensor(probs)
        #   
        # probs = (self.sentence_probabilities(yns))
        # probs = torch.exp(probs)
        pyes = []
        pno = []
        pmaybe = []
        if maybe:
            z = 3
        else:
            z = 2
        for i in range(0,len(probs), z):
            # if yns[i] not in cache.keys():
                # yes, no = self.sentence_probabilities([yns[i], yns[i+1]])
            
            if maybe:
                
                yes, maybe, no = probs[i], probs[i+1], probs[i+2]
                
                      
            else:
                yes, no = probs[i], probs[i+1]
            if norm:
                if maybe: 
                    y,m,n = torch.tensor([yes, maybe, no]).softmax(-1)
                else:
                    y,n = torch.tensor([yes, no]).softmax(-1)
              
                # cache[yns[i]] = y
                # cache[yns[i+1]] = n
                pyes.append(y)
                pno.append(n)
                if maybe:
                    pmaybe.append(m)
            else:
                pyes.append(1-yes/(yes + no))
            # else:
            #     y, n = cache[yns[i]], cache[yns[i+1]]
            #     pyes.append(y)
                # pno.append(n)/
        # print('cache length', len(cache))
        # if maybe:
        
        if maybe: return torch.stack([torch.tensor(pyes), torch.tensor(pmaybe), torch.tensor(pno)])
        return torch.tensor(pyes), torch.tensor(pmaybe), torch.tensor(pno)
    def complete(self, prompt, max_new = 25, temp = 0.9 , topk=0, gc = None):
        max_length = args.max_length
        encode_ids = self.tokenizer(
        prompt, 
        return_tensors='pt',
        padding=True,
        truncation=True,
        max_length=3000
    ).input_ids.cuda()
        gc = GenerationConfig(temperature=temp, do_sample=True, topk=0, max_length=1000, max_new_tokens=max_new, return_dict_in_generate=True, output_scores=True, pad_token_id=self.tokenizer.eos_token_id)
        generated_outputs = self.model.generate(
        encode_ids, 
        generation_config = gc
        )
        responses = self.tokenizer.batch_decode(
            generated_outputs.sequences,
            skip_special_tokens=True
        )
        return responses
        
# llm = LLM()
llm = None
import shutil

def get_bb(file, del_sols=None, seedrun=None):
    bb = {'pos':  [], 'neg': []}
    
    files = ['/'.join(file.split('/')[:-1]) + '/pos_' + file.split('/')[-1], '/'.join(file.split('/')[:-1]) + '/neg_' + file.split('/')[-1] ]
    for i in range(len(files)):
        file = files[i]
        shutil.copy(file, '/'.join(file.split('/')[:-2]) + '/tempfiles/' + str(file.split('/')[-1]))
        if not del_sols==None:
            if 'pos' in file:
                if 'neg' in file:
                    print('l. 416 uh oh')
                      
                ds = del_sols['pos']
            elif 'neg' in file:
                ds = del_sols['neg']
            for sol in ds:
                add_clause('/'.join(file.split('/')[:-2]) + '/tempfiles/' + str(file.split('/')[-1]))
                cf = open(f'/'.join(file.split('/')[:-2]) + '/tempfiles/' + str(file.split('/')[-1]), 'a')
                write_str = '\n'
                for lit in sol:
                    write_str += str(-lit) + ' '
                # write_str += '0'
                cf.write(write_str)
                cf.close()
        # print('running cadical')
        os.system("timeout 5000 " + USER_PATH + "/LLM-project/cadiback/cadiback " + '/'.join(file.split('/')[:-2]) + '/tempfiles/' + str(file.split('/')[-1]) + '> '  + '/'.join(file.split('/')[:-2]) + '/tempfiles/' + str(file.split('/')[-1])[:-4] + ".bbone")
        #   
        bbone= open('/'.join(file.split('/')[:-2]) + '/tempfiles/' + str(file.split('/')[-1])[:-4] + ".bbone", 'r')
        lines = bbone.readlines()
        #   
        for line in lines:
            if line.startswith('b'):
                #   
                lits = line.split(' ')[1:]
                for lit in lits:
                    lit = lit.strip()
                    if lit == '0':
                        continue
                    lit = int(lit)
                    if 'pos' in file:                                
                        if 'neg' in file:
                            print('l. 447 uh oh')
                              
                        bb['pos'].append(lit)
                    elif 'neg' in file:
                            bb['neg'].append(lit)

    return bb
# c = USER_PATH + '/LLM-project/dimacs_pronto_clutrr_csvs/solver_finished.csv'
import csv
import json
ablate = False
noisy_data=[]
seedrun = 'quail_1_11'
# config = 'gc shortened cot,cot thresh 1, temp1, mistral, quicksolve only once, '
config = 'if jb==0, M7' + seedrun
# config = 
# thresh=0.8
# dynamic=True
# context_thresh=0.5
# ruleethresh=0.4
try:
    os.mkdir('/home/XXXX/home/XXXX/6_26_backup/fs_backup_feb13/LLM-project/tempfiles' + str(seedrun) + '/')
    os.mkdir('/home/XXXX/home/XXXX/6_26_backup/fs_backup_feb13/LLM-project/workfiles' + str(seedrun) + '/')
except:
    print('dir already exists')
# os.environ["CUDA_VISIBLE_DEVICES"] = str(seedrun.split('_')[1])

# mistr_data = ['clutrr10.cnf']
# bad_data = ['proofd5153.cnf', 'proofd5227.cnf']
bad_data = []
mistr_data = []
c = USER_PATH + '/LLM-project/dimacs_quail_csvs/solver_finished.csv'
import csv
# import json
import pickle as pkl
dataset = '/home/XXXX/clause/dataset/new_quail.pkl'
with open(dataset, 'rb') as df:
    data = pkl.load(df)
# breakpoint()
task = 'folio'
missed=False
c = open(c, 'r')
cr = csv.reader(c)
names = []
all_outs = {}
missed_list = []
labels = {}
skiprow = True
for row in cr:
    if skiprow: 
        skiprow=False
        continue
    if row[2] == 'SAT' and row[3] == 'SAT':
    # if 1 > 0:
        cnf = open(USER_PATH + '/LLM-project/dimacs_quail/pos_'+row[1]).readlines()[0].strip('\n')
        num_clause = int(cnf.split(' ')[-1])
        if row[1] in noisy_data or row[1] in mistr_data:
            print('noisy or mistranslate')
            continue
        if task=='folio':
            bb = get_bb(USER_PATH + '/LLM-project/dimacs_quail/'+row[1], seedrun=seedrun)
            jb = set(bb['pos']).intersection(set(bb['neg']))
            if len(jb) == 0:
                print("jb = 0", USER_PATH + '/SAT-LM/tmp/' + row[1][:-4] + '.py')
                continue
        # if num_clause > 500:
            # continue
        if row[1] in bad_data:
            print('bad data')
            continue
        names.append(row[1])
        

        labels[row[1]] = data[int(row[1].split('proofd5')[1].split('.')[0])]['label']
#   
preds = {}
# breakpoint()

from tqdm import tqdm
#   
llm = LLM()
#   
# names = ['proofd537.cnf']
uhohs = []
times = {}
acc = 0
counter = 0
total_rule_scores = {}
hunh_list = []
cot_list = []
cot_acc = 0
skipped = 0
timeouts = 0

from tqdm import tqdm
votes = {}
n_fewshot = 4
    
# few_shot = "Here is some context: \n\"I wo n't be holding her hand , I wo n't be sitting with her while they figure out what bus she will ride ," + \
#     "I wo n't be standing on the sidelines , crying , saying goodbye to our summer . Instead , I will pack her lunch , give her a smooch , " + \
#     "tell her I love her and to have a great day at school then I will watch her walk out the door with her friend and wave as they gossip the" + \
#     " whopping block to the shuttle bus . I will most definitely cry after she walks out the door . I already have .\"\n" + \
#     "Here are some additional facts and rules we\'ve found, written in logical form: \n" + \
#     "my_daughter(her) \n walk_out_alone(her) IMPLIES independent(her)\n" + \
#     "Question: \n\"Why might I not walk her to the bus stop ?\"\n" + \
#     "Students answer: \n\"Because she is getting old enough to walk to the bus stop with her friends without my supervision .\"\n" + \
#     "Instruction: determine if the student\'s answer is True or False.\n" + \
#     "Let\'s think step by step. \n1. We know that the girl is the narrator's daughter. " + \
#     "\n2. Since the daughter is allowed to walk out alone, she is becoming independent." + \
#     "\n3. Children become independent as they get older." + \
#     "\n4. Therefore, the answer \"Because she is getting old enough to walk to the bus stop with her friends without my supervision\" is True\n" + \
#     "Here is some context: \n\"I am sitting here in my house in PJ 's sick as a dog ." + \
#     "I had so many plans . I was going to swing by Nessa 's party before going over to Rob 's party where I would have met up with my husband .\"\n" + \
#     "Here are some additional facts and rules we\'ve found, written in logical form: \n" + \
#     "sick(me)\n going_to(husband, Robs_party)\n sick(me) IMPLES Not(going(me, Robs_party))\n" + \
#     "Question: \n\"What would have happened had the narrator not gotten sick ?\"\n" + \
#     "Students answer: \n\"They would not have gone to the parties\"\n" + \
#     "Instruction: determine if the student\'s answer is True or False.\n" + \
#     "Let\'s think step by step. \n1. The narrator is sick, so the narrator is not going to any parties."  + \
#     "\n2. So, if the narrator had not been sick, they would go to the parties." + \
#     "\n3. Therefore, the students answer \"They would not have gone to the parties\" is False\n\"" + \
#     "Here is some context: \n\"The barbecue ended up being cooked inside and so we had some burgers and sausages . "+\
#     "It was quite nice . I left after about three hours . The only person that I knew there was Alice , so I was quite uncomfortable .\"\n" + \
#     "Here are some additional facts and rules we\'ve found, written in logical form: \n" + \
#     "at_barbecue(Alice)\n" + \
#     "Question: \n\"Why is the room so smoky ?\"\n" + \
#     "Students answer: \n\"They cooked meat in it .\"\n" + \
#     "Instruction: determine if the student\'s answer is True or False.\n" + \
#     "Let\'s think step by step. \n1. Barbecues create smoke. \n2. The barbecue was cooked inside. \n3. This means there was smoke inside." + \
#     "\n4. Therefore, the student\'s answer \"They cooked meat in it .\" is True\n" + \
#     "Here is some context: \n\"She was now in a car with him , so close , yet so far away . " + \
#     "She wanted to reach out and touch him , but feared rejection and instead left her twitching hands in her lap . " + \
#     "Sad that their short time in the car was over , she stalled , making her movements slow and weighing out her words .\"\n" + \
#     "Here are some additional facts and rules we've found, written in logical form: \n" + \
#     "feared_rejection(she) IMPLIES shy(she)" + \
#     "Question: \n\"Why would she fear a rejection from a man who 's giving her a ride ?\"\n" + \
#     "Students answer: \n\"Because she is secure about herself\"\n" + \
#     "Instruction: determine if the student\'s answer is True or False.\n" + \
#     "Let\'s think step by step. \n1. since she fears rejection, we know she is shy.\n2. People are shy if they are insecure or easily embarassed" + \
#     "\n3. Therefore, the students answer \"Because she is secure about herself\" is False."

few_shot = "Here is some context: \n\"I wo n't be holding her hand , I wo n't be sitting with her while they figure out what bus she will ride ," + \
    "I wo n't be standing on the sidelines , crying , saying goodbye to our summer . Instead , I will pack her lunch , give her a smooch , " + \
    "tell her I love her and to have a great day at school then I will watch her walk out the door with her friend and wave as they gossip the" + \
    " whopping block to the shuttle bus . I will most definitely cry after she walks out the door . I already have .\"\n" + \
    "Question: \n\"Why might I not walk her to the bus stop ?\"\n" + \
    "Students answer: \n\"Because she is getting old enough to walk to the bus stop with her friends without my supervision .\"\n" + \
    "Instruction: determine if the student\'s answer is True or False.\n" + \
    "Let\'s think step by step. \n1. We know that the girl is the narrator's daughter. " + \
    "\n2. Since the daughter is allowed to walk out alone, she is becoming independent." + \
    "\n3. Children become independent as they get older." + \
    "\n4. Therefore, the answer \"Because she is getting old enough to walk to the bus stop with her friends without my supervision\" is True\n" + \
    "Here is some context: \n\"I am sitting here in my house in PJ 's sick as a dog ." + \
    "I had so many plans . I was going to swing by Nessa 's party before going over to Rob 's party where I would have met up with my husband .\"\n" + \
    "Question: \n\"What would have happened had the narrator not gotten sick ?\"\n" + \
    "Students answer: \n\"They would not have gone to the parties\"\n" + \
    "Instruction: determine if the student\'s answer is True or False.\n" + \
    "Let\'s think step by step. \n1. The narrator is sick, so the narrator is not going to any parties."  + \
    "\n2. So, if the narrator had not been sick, they would go to the parties." + \
    "\n3. Therefore, the students answer \"They would not have gone to the parties\" is False\n\"" + \
    "Here is some context: \n\"The barbecue ended up being cooked inside and so we had some burgers and sausages . "+\
    "It was quite nice . I left after about three hours . The only person that I knew there was Alice , so I was quite uncomfortable .\"\n" + \
    "Question: \n\"Why is the room so smoky ?\"\n" + \
    "Students answer: \n\"They cooked meat in it .\"\n" + \
    "Instruction: determine if the student\'s answer is True or False.\n" + \
    "Let\'s think step by step. \n1. Barbecues create smoke. \n2. The barbecue was cooked inside. \n3. This means there was smoke inside." + \
    "\n4. Therefore, the student\'s answer \"They cooked meat in it .\" is True\n" + \
    "Here is some context: \n\"She was now in a car with him , so close , yet so far away . " + \
    "She wanted to reach out and touch him , but feared rejection and instead left her twitching hands in her lap . " + \
    "Sad that their short time in the car was over , she stalled , making her movements slow and weighing out her words .\"\n" + \
    "Question: \n\"Why would she fear a rejection from a man who 's giving her a ride ?\"\n" + \
    "Students answer: \n\"Because she is secure about herself\"\n" + \
    "Instruction: determine if the student\'s answer is True or False.\n" + \
    "Let\'s think step by step. \n1. since she fears rejection, we know she is shy.\n2. People are shy if they are insecure or easily embarassed" + \
    "\n3. Therefore, the students answer \"Because she is secure about herself\" is False."

    
answers = ['true', 'false']
import time
time_str = str(time.ctime()).replace(' ', '_').replace(':', '.')

answers = ['true', 'false']
import time
time_str = str(time.ctime()).replace(' ', '_').replace(':', '.')
skip_pbar=True
import argparse 

parser = argparse.ArgumentParser(
                prog='ProgramName',
                description='What the program does',
                epilog='Text at the bottom of help')

parser.add_argument('-seedrun')

pargs = parser.parse_args()
seedrun = pargs.seedrun

# idxs = pkl.load(open('/home/XXXX/quail_idxs.pkl', 'rb'))
idxs = list(range(500))


for z in tqdm(range(20)):
    acc = 0
    total = 0
    preds = []
    accs = {}
    i = 0
    for i in idxs:
        name = 'proofd5' + str(i) + '.cnf'
        print('sc iteration: ' + str(z))
        print('datapoint: ' + str(i))
        # i += 1
        if name not in votes.keys():
            votes[name] = torch.tensor([0.0, 0.0])
        

        prob = data[i]
       

 
        prompt = few_shot +  'Here is some context: \n' + prob['context'] + '\nQuestion: \n\"' + prob['question'] + '\"\nStudents answer: \n\"' + prob['query'] + '\"\n'+ '"Instruction: determine if the student\'s answer is True or False.\n Let\'s think step by step. \n1.' 
  
        ans = llm.complete(prompt, max_new=1000)[0]
        # if len(ans.split('Facts')) > 7:
        #     ans = 'Facts'.join(ans.split('Facts')[:5])
        ans_prompt = ans + "Therefore, the answer (True/False) is "
       
        ans_prompt = 'Here is some context:' + ans.split('Here is some context:')[n_fewshot+1] + "Therefore, the answer (True/False) is "
        # nli = torch.tensor(list(llm.nli(ans_prompt, False).values()))
        # votes[nli.argmax()] += 1.0
        # print(nli)
        # print(ans_prompt)
        # continue  
        # answer = answers[torch.argmax(nli)]
        # breakpoint()

        # ans = ans.split('***')[n_fewshot]

        # try: lines = ans.split('\n')
        # except: breakpoint()
        # i = -1
        # prob['label'] = str(prob['label'] == 'entailment').lower()
        notherefore=False
        try: 
            m = ans_prompt.split('Therefore')[1]
            if 'Yes' in m: 
                nli = torch.tensor([1,0])
                # print('[1,0]')
                # print(ans_prompt)
                # continue
    
            elif 'No' in m: 
                nli = torch.tensor([0,1])
                # print('[0,1]')
                # print(ans_prompt)
                # continue
            else: 
                nli = torch.tensor(list(llm.nli(ans_prompt, False).values())).softmax(-1)
            # votes += nli.softmax(-1)
        except: 
            nli = torch.tensor(list(llm.nli(ans_prompt, False).values())).softmax(-1)
        # nli = torch.tensor(list(llm.nli(ans_prompt, unknown).values()))    
        answer = answers[torch.argmax(nli)]
        votes[name] += nli
        s_probs, ind = torch.sort(nli)
        print(ans_prompt)
        print(nli)
        print(prob['label'].strip(' ').lower())
        # answer = answers[ind[-1]]
        # if s_probs[-1] < torch.sum(s_probs[:-1]):
        #     answer=answers[1]
        if answer.strip(' ') == prob['label'].strip(' ').lower():
            acc += 1
            accs[name] = 1
        # print(answer, prob['label'])
        # if answer == 'Unknown':
        #     print('maybe')
        # if prob['answer'] == 'Unknown':
        #     print('maybe is correct')
        total += 1
        preds.append(answer)
        # run_log = open(run_log_path, 'a')
        # run_log.write(str(ans) + '\n')
        # run_log.write(str(nli) + '\n')
        
        # if answer.strip(' ') == labels[name].strip(' '):
        #     run_log.write('Correct: ' + answer + '\n')
        # else:
        #     run_log.write('Incorrect: (pred,real): ' + answer + ', ' + labels[name] + '\n')
        # run_log.close()
        print('running acc: ', acc, '/', total)
    print(acc, '/', total)
    # run_log = open(run_log_path, 'a')
    # run_log.write('Few-Shot COT Accuracy CLUTRR iter ' + str(z) + ': ' + str(acc) + '/' + str(total) + '\n')
    # run_log.close()
    file = open(USER_PATH + 'LLM-project/preds/L8_FewShotCOT_newquail_good_' + time_str + '_iter' + str(z), 'wb')
    np.save(file, preds)
    file.close()
    file = open(USER_PATH + 'LLM-project/preds/L8_FewShotCOT_newquail_votes_good_' + time_str + '_iter' + str(z), 'wb')
    np.save(file, votes)

    file = open(USER_PATH + 'LLM-project/preds/L8_FewShotCOT_newquail_accs_good_' + time_str + '_iter' + str(z), 'wb')
    np.save(file, accs)

    file.close
        # breakpoint()
# breakpoint()



