import pandas as pd
import numpy as np
import time
from AttributesSelection import attribution_select_Dis, attribution_select, transpose_list
from EquilibriumParameter import feature_distribution_up_0, equilibrium_state_parameter_set
from LongRunTraining import long_run_equilibrium_l
from PredictiorForPoint import ESE_predictor_system_ar
from StateParameter import state_parameter_set
from Correlation import attribution_correlate_coe

raw_data_attribute = pd.read_csv("demo_er/attribute/try1.csv")

raw_data_attribute = np.array(raw_data_attribute)

number_part = 16# the number of all part
name_part = raw_data_attribute[:, 0]

############################################
# for choosing attributes
############################################

attribute_list = {2, 3, 4, 5, 6, 7, 8, 9, 10, 11}#, 12, 13, 14, 15, 16, 17, 18, 19}



time_record = []
prediction = []
for t in range(1000):

    ###########################################
    # setting for time period
    ###########################################

    start = -100 + t  # ceg ipo only 60 days
    end = -1 + t
    number_time_unit = end - start
    ######## load daily data ################

    date = pd.read_csv("demo_er/AUD.csv")
    date = np.array(date)
    date = date[start:end, 0].astype(str)

    # number_name = range(len(name_part)) # number of part names

    # number_name = range(len(name_part))
    raw_data = []  #### !!! revise raw_data -> a matrix of raw records, each column represents a time unit, e.g. a day or an hour, each row represnts data of a part/system at different time units ###

    raw_data_sum = []  #### raw_data_sum -> 1D array, each element is the sum of all parts at a particular time point

    ##### load daily data raw and attribute data #####
    target_data = 5  # select the target variable data

    for i in range(number_part):
        share = pd.read_csv("demo_er/" + name_part[i] + ".csv")  # read the daily data
        part = np.array(share)
        data = part[start:end, target_data].astype(float)  ### 5 is hard code  target data column
        # data = part[:, target_data].astype(float)  ### 5 is hard code  target data column
        raw_data.append(data)
        # raw_data.extend(data)

    ###  Transpose the data matrix so each row is systems/parts at a particular time point,
    ###  while each column is the time series of a system/part
    daily_state = list(map(list, zip(*raw_data)))
    # raw_data = np.asarray(raw_data)
    # daily_state = np.transpose(raw_data)
    # print(daily_state[100])

    ### Calculate the sum of all parts, e.g. sum of one row
    for i in range(len(daily_state)):
        total = sum(daily_state[i])
        raw_data_sum.append(total)
    print(raw_data_sum)

    ### spss is a collection of sps, the state parameter set for one time point
    spss = []
    for i in range(len(raw_data[0])):  # test_start+h_start-1 is t_0
        sps = state_parameter_set(daily_state[i])
        sps = sps.astype(float)
        spss.append(sps)

    ### attribute selection based on Dis
    method_choose = 1  # 1 is the EI method based on Euclidean distance, 2 is based on difference

    selected_attribute_list = attribution_select(method_choose, raw_data_attribute, spss, attribute_list)
    number_attribute = len(selected_attribute_list)

    ### data of selected attributes
    selected_attribute_set = raw_data_attribute[:, selected_attribute_list]




    start_time = time.time()

    ### Calculate the correlation between the state parameter set and the last data point which is the prediction target

    model = 3  ### 3 is the switch value for OLS

    correlates = attribution_correlate_coe(model, selected_attribute_set, spss[-1])

    ### sum of the absoluton values of correlations
    sum_cor = sum(abs(correlates))  ### sum_correlation

    ### generate feature values for each attribute under all systems/parts
    x = 0
    for i in range(number_attribute):
        a = feature_distribution_up_0(selected_attribute_set[:, i], correlates[i])
        x += a

    ### equilibrium sps, initial value
    esps_0 = equilibrium_state_parameter_set(sum_cor, number_attribute, number_part, x)

    ### long run equilibirum training
    esps = long_run_equilibrium_l(esps_0, spss, 2)

    ### prediction based on the trained esps
    p = ESE_predictor_system_ar(raw_data_sum, esps,
                                3)  ### default prediction distance = 1, h is for setting the prediction distance

    ### p = daily_data_total_raw[-1]*esps ### prediction with just esps based on historical data

    prediction.append(p)

    end_time = time.time()  # 1657267201.6171696

    time1 = end_time - start_time
    time_record.append(time1)


# csv
result_record = np.array(prediction)
np.array(result_record)
save = pd.DataFrame(result_record)
save.to_csv('result.csv', index=False, header=False)

time_record = np.array(time_record)
time_record = time_record.T
np.array(time_record)
save = pd.DataFrame(time_record, columns=['time'])
save.to_csv('time.csv', index=False, header=False)

print('finish')