import re
# Input files: one ground-truth letter per line, and one raw model
# transcript per line for the normal and perturbed prompt variants.
GROUNDTRUTH_PATH = "codeline_groundtruth.txt"
NORMAL_OUTPUTS_PATH = "normal_codeline_outputs.txt"
PERTURBED_OUTPUTS_PATH = "perturbed_codeline_outputs.txt"

# A standalone capital letter A-D: preceded by whitespace or start of string,
# followed by whitespace, one of ". , ! ?", or end of string.
ANSWER_PATTERN = re.compile(r"(?:\s|^)[A-D](?=\s|[.,!?]|$)")


def extract_response(line):
    """Return the model's reply portion of one raw transcript line.

    The reply is the text after the last ``[/INST]`` marker inside the
    segment that precedes the final ``</s>`` token.

    Raises:
        IndexError: if *line* contains no ``</s>`` token.
    """
    return line.split("</s>")[-2].split("[/INST]")[-1]


def extract_answer(text):
    """Return the first standalone A-D letter found in *text*, or ``None``."""
    match = ANSWER_PATTERN.search(text)
    if match is None:
        return None
    # The match may include the single leading whitespace character.
    return match.group().strip()


def score(groundtruth, outputs):
    """Count correct and answered responses.

    Args:
        groundtruth: sequence of expected answer strings.
        outputs: sequence of model replies, aligned with *groundtruth*.
            Extra trailing entries are ignored.

    Returns:
        ``(correct, answered)`` where *answered* is the number of replies
        containing a recognisable A-D answer and *correct* is how many of
        those equal the expected answer.

    Raises:
        ValueError: if *outputs* has fewer entries than *groundtruth*.
    """
    if len(outputs) < len(groundtruth):
        raise ValueError(
            f"expected at least {len(groundtruth)} outputs, got {len(outputs)}"
        )
    correct = 0
    answered = 0
    for expected, reply in zip(groundtruth, outputs):
        answer = extract_answer(reply)
        if answer is None:
            # Replies without a recognisable answer are excluded from the
            # denominator, not counted as wrong.
            continue
        answered += 1
        if answer == expected:
            correct += 1
    return correct, answered


def accuracy(correct, answered):
    """Return ``correct / answered``, or NaN when nothing was answered."""
    if answered == 0:
        return float("nan")
    return correct / answered


def read_lines(path):
    """Read *path* and return its lines (newlines kept), closing the file."""
    with open(path, "r") as handle:
        return handle.readlines()


def main():
    """Score normal and perturbed model outputs against the ground truth."""
    groundtruth = [line.rstrip() for line in read_lines(GROUNDTRUTH_PATH)]
    normal_outputs = [
        extract_response(line) for line in read_lines(NORMAL_OUTPUTS_PATH)
    ]
    perturbed_outputs = [
        extract_response(line) for line in read_lines(PERTURBED_OUTPUTS_PATH)
    ]

    print(perturbed_outputs)
    print(normal_outputs)
    for index, reply in enumerate(perturbed_outputs[: len(groundtruth)]):
        print(reply, index)

    perturbed_correct, perturbed_answered = score(groundtruth, perturbed_outputs)
    normal_correct, normal_answered = score(groundtruth, normal_outputs)

    print("Normal:", accuracy(normal_correct, normal_answered))
    print("Perturbed:", accuracy(perturbed_correct, perturbed_answered))
    print(normal_answered, perturbed_answered)


if __name__ == "__main__":
    main()