dir_ = "./" # directory
N = 10000 # number of instances

import pandas as pd
from statistics import mean
from Conversion import EfficientConversion
iter_n = 10
m_list = [3, 5, 4, 4, 4, 6] 
for num_, data in enumerate(["insurance", "water", "alarm", "barley", "hailfinder", "hepar2"]):
    m = m_list[num_]
    lambda0 = []
    lambda12 = []
    ratio1 = []
    ratio2 = []
    bits1 = []
    bits2 = []
    for num in range(iter_n):
        CPS0 = pd.read_csv(dir_ + data + "/" + data + "_" + str(N) + "_true_none_" + str(num + 1) + ".csv")
        CPS = pd.read_csv(dir_ + data + "/" + data + "_" + str(N) + "_true_" + str(num + 1) + ".csv")
        EC = EfficientConversion()
        List = EC.encode(CPS)
        U_list = List[1]
        V_list = List[2]
        n = len(U_list)
        lambda0_ = len(CPS0) - n
        lambda0 += [lambda0_]
        lambda12_ = sum([len(U_list[i]) + len(V_list[i]) for i in range(n)])
        lambda12 += [lambda12_]
        ratio1 += [lambda0_ / (n * ((n - 1) ** (m/2)))]
        ratio2 += [lambda12_ / lambda0_]
        bits1_ = lambda12_ + n * (n - 1) / 2
        bits1 += [bits1_]
        bits2_ = sum([(len(U_list[i]) + len(V_list[i])) * (len(U_list[i]) + len(V_list[i]) + 1) for i in range(n)]) + n * (n - 1) / 2
        bits2 += [bits2_]
    print(data, round(mean(lambda0)), round(mean(ratio1),5), round(mean(ratio2),5), round(mean(bits1)), round(mean(bits2)))