import pandas as pd
import csv
import json
class args:
    base_path="/tofu/min_var_cluster_0_removed_outliers_switch_idk_result.csv"
    base_path="/tofu/{}.csv"
    outpath_jb = "/tofu/all_results_jb.csv"
    outpath = "/tofu/all_results.csv"

def gather_results(args):
    all_results = []
    topics = json.load(open("/wiki/topics.json", "r"))[:6]


    for i in range(5,6,1):
        
        for var in ['bert_']:#["emb_ans_"]:#["bert_"]: #["random_"]: #["min_var_"]: #["_min_var"]
            name = var+"cluster_"+str(i)+"_base_jailbreak_result"
            
            cur_line = open(args.base_path.format(name)).readlines()[0]
            # import pdb;pdb.set_trace();
            # values = cur_line.split(',')
            # values = [v for i, v in enumerate(values) if i not in range(8,16,1)]
            # processed_line = ','.join(values)

            all_results.append(name+","+cur_line)
            cur_line = open(args.base_path.format(name)).readlines()[1]
            # values = cur_line.split(',')
            # values = [v for i, v in enumerate(values) if i not in range(8,16,1)
            # processed_line = ','.join(values)
            # import pdb;pdb.set_trace();
            
            all_results.append(name+","+cur_line)
            for unlearn in ["_switch_unlearn_"]: #["_switch_idk_result"]:#["_base_result"]: #"_switch_unlearn_result", "_switch_idk_result"]:
                for type in [""]: #[""]: #["","_subsampled", "_removed_outliers"]:   
                    for k in range(10):             
                        name = var+"cluster_"+str(i)+"_"+var+"cluster_"+str(i)+type+unlearn+str(12*(k+1))+"_lora1_c2_{}_jailbreak_result".format(k)
                        # if k==0:
                        #     all_results.append(name+","+open(args.base_path.format(name)).readlines()[0])
                        # cur_line = name+","+open(args.base_path.format(name)).readlines()[1]
                        # values = cur_line.split(',')
                        # values = [v for i, v in enumerate(values) if i not in range(8,16,1)]
                        # processed_line = ','.join(values)
                        # all_results.append(processed_line)    
                        all_results.append(name+","+open(args.base_path.format(name)).readlines()[1])

            with open(args.outpath_jb, mode="w") as file:
                for line in all_results:
                    file.write(line)

            all_results = []
            
            name = var+"cluster_"+str(i)+"_base_result"
            
            cur_line = open(args.base_path.format(name)).readlines()[0]
            # import pdb;pdb.set_trace();
            # values = cur_line.split(',')
            # values = [v for i, v in enumerate(values) if i not in range(8,16,1)]
            # processed_line = ','.join(values)

            all_results.append(name+","+cur_line)
            cur_line = open(args.base_path.format(name)).readlines()[1]
            # values = cur_line.split(',')
            # values = [v for i, v in enumerate(values) if i not in range(8,16,1)
            # processed_line = ','.join(values)
            # import pdb;pdb.set_trace();
            
            all_results.append(name+","+cur_line)
            for unlearn in ["_switch_unlearn_"]: #["_switch_idk_result"]:#["_base_result"]: #"_switch_unlearn_result", "_switch_idk_result"]:
                for type in [""]: #[""]: #["","_subsampled", "_removed_outliers"]:   
                    for k in range(10):             
                        name = var+"cluster_"+str(i)+"_"+var+"cluster_"+str(i)+type+unlearn+str(12*(k+1))+"_lora1_c2_{}_result".format(k)
                        # if k==0:
                        #     all_results.append(name+","+open(args.base_path.format(name)).readlines()[0])
                        # cur_line = name+","+open(args.base_path.format(name)).readlines()[1]
                        # values = cur_line.split(',')
                        # values = [v for i, v in enumerate(values) if i not in range(8,16,1)]
                        # processed_line = ','.join(values)
                        # all_results.append(processed_line)    
                        all_results.append(name+","+open(args.base_path.format(name)).readlines()[1])

    with open(args.outpath, mode="w") as file:
        for line in all_results:
            file.write(line)

if __name__ == "__main__":
    gather_results(args)








