import pandas as pd
import os.path as osp
import numpy as np
from scipy import stats
import os

from utils import mkdir_if_missing, load_dict, save_dict, segment


def data_process(d):
    f_data = d[np.where((d[:, -1] != 0) & (d[:, -1] != 12))]
    x_data = f_data[:, :-1]
    y_data = f_data[:, -1]
    x, y = segment(x_data, y_data, num_channel=num_channel, window_size=width)
    return x, y


def write_files(path, save_path):
    files = []
    for r, d, f in os.walk(path):
        for file in f:
            if '.log' in file:
                files.append(os.path.join(r, file))
    for f in files:
        print(f)

    data_dic = {}
    for file in files:
        e = file.index('.')
        st = file[-12:e]
        ns = st.index('t')
        sub = st[ns + 1:]
        data_dic[sub] = np.genfromtxt(file)

    for key in data_dic.keys():
        user = str(int(key))
        x, y = data_process(data_dic[key])
        mkdir_if_missing(osp.join(save_path, user))
        for idx, (d, l) in enumerate(zip(x, y)):
            l = str(int(l - 1))
            mkdir_if_missing(osp.join(save_path, user, l))
            file_path = osp.join(save_path, user, l, "{}_{}_{}.pkl".format(user, l, str(idx)))
            save_dict(d, file_path)
        print("User {} done!".format(user))


if __name__ == "__main__":
    width = 100
    num_channel = 23
    file_path = 'E:/SensingRawData/MHEALTH'
    save_class_path = "E:/Datasets/Source/Sensing/MHEALTH"
    write_files(file_path, save_class_path)
