import os
import random
import time
from collections import defaultdict
from pathlib import Path

import numpy as np
from baseline import INFERENCE

datset_dir = "data"


def setup_seed(seed=42):
    np.random.seed(seed)
    random.seed(seed)


def get_report(abbrev, dataset_path, algorithm):

    label = dataset_path / "label.csv"
    truth = dataset_path / "truth.csv"
    seeds = [42]
    report = defaultdict(list)
    times = []
    for seed in seeds:
        setup_seed(seed)
        # compute time
        start = time.time()
        rep = INFERENCE(label, truth, alg=algorithm).infernce()[1]
        for key, value in rep.items():
            report[key].append(value)
        end = time.time()
        times.append(end - start)
    return report, np.mean(times)


algs = ["MV", "DS", "PM", "CATD", "BWA", "IBCC", "EBCC", "GLAD"]
# algs = ["MV", "DS", "PM", "CATD", "BWA", "IBCC", "EBCC"]
for abbrev in sorted(os.listdir(datset_dir)):
    dataset_path = Path(datset_dir) / abbrev
    for alg in algs:
        print(abbrev, alg)
        report, times = get_report(abbrev, dataset_path, alg)
        with open("report.csv", "a") as f:
            for key, value in report.items():
                f.write(f"{abbrev},{alg},{key},{np.mean(value)},{np.std(value)},{np.mean(times)}\n")
