from pathlib import Path

import numpy as np
import tensorflow as tf

import cfg


def do(df, dataset, weight_init, training, training_paradigm):
    # load x_data
    if weight_init == 'tl' and training == 'frozen' and training_paradigm != 'augmented':
        x_data = np.load(Path(cfg.path_data, dataset, 'data_embedding.npy'))
    # read data
    elif dataset in ['scene', 'letter', 'mscoco', 'cifar10']:
        x_data = np.load(Path(cfg.path_data, dataset, 'data.npy'))

    # filter x_data, use only the samples available in the df
    x_data_filtered = x_data[df.index.to_numpy()]

    # load y_data
    label_cols = [col for col in df.columns if col.startswith(cfg.label_prefix)]
    y_data = df[label_cols].to_numpy()

    # reset df indices
    df = df.reset_index(drop=True)

    return x_data_filtered, y_data, df