import h5py
import numpy as np
import os


def average_data(algorithm="", dataset="", goal="", times=10):
    """
    Compute and print the mean and standard deviation of the best test accuracy over multiple runs.

    Args:
        algorithm (str): Algorithm name.
        dataset (str): Dataset name.
        goal (str): Experiment goal.
        times (int): Number of experiment runs.
    """
    test_acc = get_all_results_for_one_algo(algorithm, dataset, goal, times)

    max_accurancy = []
    for i in range(times):
        max_accurancy.append(test_acc[i].max())

    print("std for best accurancy:", np.std(max_accurancy))
    print("mean for best accurancy:", np.mean(max_accurancy))


def get_all_results_for_one_algo(algorithm="", dataset="", goal="", times=10):
    """
    Retrieve test accuracy results for one algorithm over multiple runs.

    Args:
        algorithm (str): Algorithm name.
        dataset (str): Dataset name.
        goal (str): Experiment goal.
        times (int): Number of experiment runs.

    Returns:
        list: List of numpy arrays containing test accuracy for each run.
    """
    test_acc = []
    algorithms_list = [algorithm] * times
    for i in range(times):
        file_name = dataset + "_" + algorithms_list[i] + "_" + goal + "_" + str(i)
        test_acc.append(np.array(read_data_then_delete(file_name, delete=False)))

    return test_acc


def read_data_then_delete(file_name, delete=False):
    """
    Read test accuracy data from an HDF5 file and optionally delete the file.

    Args:
        file_name (str): Name of the result file (without extension).
        delete (bool): Whether to delete the file after reading.

    Returns:
        np.ndarray: Array of test accuracy values.
    """
    file_path = "../results/" + file_name + ".h5"

    with h5py.File(file_path, 'r') as hf:
        rs_test_acc = np.array(hf.get('rs_test_acc'))

    if delete:
        os.remove(file_path)
    print("Length: ", len(rs_test_acc))

    return rs_test_acc