import sys
import os
# 获取当前文件的绝对路径，并向上追溯到项目根目录（your_project）
current_dir = os.path.dirname(os.path.abspath(__file__))
project_root = os.path.dirname(current_dir)  # 根据实际层级调整
sys.path.append(project_root)
# import a funciton at ../datasets/datasetloader.py
from datasets.datasetloader import getdatasetpath
import pandas as pd
import numpy as np
import torch
from sklearn.metrics import roc_auc_score, accuracy_score, recall_score, precision_score, f1_score, average_precision_score
from sklearn.model_selection import train_test_split
import warnings
from sklearn.model_selection import KFold
warnings.filterwarnings("ignore")

def winsorize(data, lower=0.05, upper=0.95): 
    lower_bound = np.quantile(data, lower)
    upper_bound = np.quantile(data, upper)
    return np.clip(data, lower_bound, upper_bound)

n_exp = 1
n_group = 30
dataset_name = 'trade'
n_subjects = 20
# start of test day: day 30 -> end of test day: day 89 - 11 day= 78, 
n_days_train = 41 # 41 # start of train day: day 10, end of train days, left back 10 days, 
n_days_test = 61 # 81 # end of n days test, left back 10 days, 
n_stock = 20 # 3214, 

# ------------------------assessment of iide and bias-------------------------
p_values = {}
model_names = ['lgbm', 'xgb',] # 'linear', 'catboost'] # 'mlp', 'svm', 'rf', 'lgbm', 'xgb', 'catboost'] # , 'tabpfn']
test_names = ['iid', 'id', 'bias']
subject_names = ['lr', 'nn', 'fusion']
shap_features = ['fusion', 'subject', 'proxy', 'condition', 'subject_condition', 'subject_proxy', 'condition_proxy']

for model_name in model_names:
    for test_name in test_names:
        for subject_name in subject_names:
            p_values[f"{model_name}_{test_name}_{subject_name}"] = []
# -------------------------------------------------------------------

# ------------------------assessment of errors-------------------------
errors = {}
errors_s = {}
errors_p = {}
errors_c = {}
errors_sc = {}
errors_cp = {}
errors_sp = {}

for model_name in model_names:
    for subject_name in subject_names:
        errors[f"{model_name}_{subject_name}"] = []
        errors_s[f"{model_name}_{subject_name}"] = []
        errors_p[f"{model_name}_{subject_name}"] = []
        errors_c[f"{model_name}_{subject_name}"] = []
        errors_sc[f"{model_name}_{subject_name}"] = []
        errors_cp[f"{model_name}_{subject_name}"] = []
        errors_sp[f"{model_name}_{subject_name}"] = []
# -------------------------------------------------------------------


# add baseline model: last 10 days, 
errors['roi_last10days_fusion'] = []
errors['roi_last10days_lr'] = []
errors['roi_last10days_nn'] = []
# -------------------------------------------------------------------

for i_exp in range(n_exp):
    # ---------------------------------read dataset---------------------------------
    datasetpath = getdatasetpath(dataset_name)
    data_df = pd.read_csv(datasetpath)
    # ---------------------------------------------------------------------------------------------------

    # ---------------------------------drop specifical, sort by stock code and date---------------------------------
    stockcounts  = data_df['股票代码'].value_counts()
    data_df = data_df[data_df['股票代码'].isin(stockcounts[stockcounts==89].index)]
    data_df = data_df.reset_index(drop=True)
    data_df['日期'] = pd.to_datetime(data_df['日期']) # 89 days for each stock
    data_df['日期'] = data_df['日期'].dt.date
    data_df = data_df.sort_values(['股票代码', '日期'])
    # print("data df head: ", data_df.head(93))
    # --------------------------------------------------------------------------------

    # ------------------drop 8 days data for all stocks------------------
    # keep 1 days for the model input, 
    # data_df = data_df.groupby('股票代码').apply(lambda x: x.iloc[8:])
    data_df = data_df.reset_index(drop=True)
    # print("number of stocks: ", data_df['股票代码'].value_counts())
    # ------------------------------------------------------------------------

    # --------------------normalize EC for input of decision model--------------------
    x_column_name = ['获利比例', '平均成本', '90成本-低', '90成本-高', '90集中度',
            '70成本-低', '70成本-高', '70集中度', '收盘', '开盘', '最高', 
            '最低', '成交量', '成交额', '振幅']
    norm_df = data_df[x_column_name]
    norm_df = (norm_df - norm_df.mean()) / norm_df.std()
    # ------------------------------------------------------------------------

    # ------------------------------create subject space: decision model-----------------------------
    # subject space: logistic regression, and 2-layer NN
    # sample a subject: one decision model for every 10 days, 
    class LinearSubject(torch.nn.Module):
        def __init__(self,n_input):
            super(LinearSubject, self).__init__()
            self.linear = torch.nn.Linear(n_input, 3)
            self.linear.weight = torch.nn.Parameter(torch.rand(3, n_input)*2-1)
            self.linear.bias = torch.nn.Parameter(torch.rand(3)*2-1)
        def forward(self, x):
            linear = self.linear(x)
            # print("linear:", linear)
            softmax_output = torch.nn.functional.softmax(linear, dim=1)
            decision = torch.argmax(softmax_output, dim=1)
            return decision
    
    class NNSubject(torch.nn.Module):
        def __init__(self, n_input, maxhidden = 8):
            super(NNSubject, self).__init__()
            self.linear1 = torch.nn.Linear(n_input, maxhidden)
            self.linear2 = torch.nn.Linear(maxhidden, 3)
            self.sigmoid = torch.nn.Sigmoid()
            self.layer1 = torch.nn.Sequential(
                self.linear1,
                self.sigmoid
            )
            self.layer2 = torch.nn.Sequential(
                self.linear2,
                self.sigmoid
            )
        def forward(self, x):
            layer1_out = self.layer1(x)
            layer2_out = self.layer2(layer1_out)
            softmax_output = torch.nn.functional.softmax(layer2_out, dim=1)
            decision = torch.argmax(softmax_output, dim=1)
            return decision

    class LinearFloat(torch.nn.Module):
        def __init__(self, n_subject_input=15, subject_label='linear', max_hidden=8):
            super(LinearFloat, self).__init__()
            if subject_label == 'linear':
                n_input = n_subject_input*3+3
                self.linear = torch.nn.Linear(n_input, 1)
                self.linear.weight = torch.nn.Parameter(torch.rand(1, n_input)*2-1)
                self.linear.bias = torch.nn.Parameter(torch.rand(1)*2-1)
            elif subject_label == 'nn': # 15*8+8+8*3+3 = 120 + 8 + 24 + 3 = 155
                n_input = n_subject_input*max_hidden + max_hidden + max_hidden*3 + 3
                self.linear = torch.nn.Linear(n_input, 1)
                self.linear.weight = torch.nn.Parameter(torch.rand(1, n_input)*2-1)
                self.linear.bias = torch.nn.Parameter(torch.rand(1)*2-1)
        def forward(self, x, float_ratio = 0.001):
            linear = self.linear(x)
            output = float_ratio*(2*torch.nn.functional.sigmoid(linear)-1)
            return output
    # ---------------------------------------------------------------------------------------------------

    # ---------------------------sampling from subject space-----------------------------
    subject_lr_list = []
    subject_lr_vector_list = []
    subject_nn_list = []
    subject_nn_vector_list = []
    subject_label = []
    subject_list = []
    subject_vector_list = []
    n_input = len(x_column_name)
    for i in range(n_subjects):
        # 0: 0.5 probability to select a linear, and 1: 0.5 probability to select a NN, 
        subject_label.append(np.random.choice([0, 1]))
        n_input = len(x_column_name)
        if subject_label[-1] == 0: # create a linear subject, 
            subject = LinearSubject(n_input)
            subject_lr_list.append(subject)
            subject_lr_vector_list.append(torch.cat([p.view(-1) for p in subject.parameters()]).detach().numpy().tolist())
        else: # create a NN subject, 
            subject = NNSubject(n_input)
            subject_nn_list.append(subject)
            subject_nn_vector_list.append(torch.cat([p.view(-1) for p in subject.parameters()]).detach().numpy().tolist())
        subject_list.append(subject)
        subject_vector = torch.cat([p.view(-1) for p in subject.parameters()]).detach().numpy().tolist()
        subject_vector_list.append(subject_vector)
    # ---------------------------------------------------------------------------------------------------

    # -------------evaluation task--------------------
    # subject: logistic regression, and 2-layer NN
    #   subject input: last day's x_column, 
    #   subject output: buy, sell, or hold,
    # condition: last 10 days' x_column, 
    # metric: next 10 days' return, 
    # es: next 10 days' close price * float rate(subject), 
    # em: 
    #   input: [subject_vector, condition_vector, last 10 days' backtest return without float]
    #   output: [metric]
    # error function: RMSE
    # ------------------------------------------------
    
    # -----------------------create the metric space-------------------------------
    floatmodel_lr = LinearFloat(n_subject_input=15, subject_label='linear', max_hidden=8)
    floatmodel_nn = LinearFloat(n_subject_input=15, subject_label='nn', max_hidden=8)
    # ---------------------------------------------------------------------------------------------------
    te_subject_list = []
    te_condition_list = []
    te_metric_list = []
    te_metric_proxy_list = []
    te_subject_lr_list = []
    te_subject_nn_list = []
    te_subject_vector_list = []
    te_subject_vector_lr_list = []
    te_subject_vector_nn_list = []
    te_condition_lr_list = []
    te_condition_nn_list = []
    te_metric_lr_list = []
    te_metric_nn_list = []
    te_metric_lr_proxy_list = []
    te_metric_nn_proxy_list = []
    n_subject_tr =int(n_subjects * 0.8)
    n_subject_te = n_subjects - n_subject_tr
    errors_roi_last10days_fusion_list = []
    errors_roi_last10days_lr_list = []
    errors_roi_last10days_nn_list = []
    for i in range(n_subject_te): # every trade strategy, 400 subjects, on test,
        print(f" test exp: {i_exp}, subject: {i}") 
        for day_id in range(n_days_train, n_days_test): # start of test day: day 30 -> end of test day: day 89 - 11 day
            for stock_id in range(n_stock):
                # get the subject, 
                index = i + n_subject_tr
                subject = subject_list[index]
                subject_vector = subject_vector_list[index]
                # get the decision of the subject for the last 10 days, 
                # get the index by stock id, day_id,
                last10days_start_index = stock_id * 89 + day_id - 10
                last10days_end_index = stock_id * 89 + day_id
                next10days_start_index = stock_id * 89 + day_id
                next10days_end_index = stock_id * 89 + day_id + 10
                last10days_tensor = torch.tensor(norm_df.iloc[last10days_start_index:last10days_end_index].values, dtype=torch.float32)
                last10days_decisions = subject(last10days_tensor)
                # get the decision of the subject for the next 10 days,
                next10days_tensor = torch.tensor(norm_df.iloc[next10days_start_index:next10days_end_index].values, dtype=torch.float32)
                # get the decision of the subject for the next 10 days,
                next10days_decisions = subject(next10days_tensor)

                # get the reference metric (ROI) by apply the subject to the last 10 days,
                # decision: 0-买入，1-持有，2-卖出, holds: 0: +1, 1: +0; 2: -1,
                holds = []
                last10days_return = 0.0
                last10days_invest = 0.0
                for j in range(0, 10):
                    # get the float model input, and use the subject to get the float ratio,
                    float_input = torch.tensor(subject_vector, dtype=torch.float32)
                    if subject_label[index] == 0:
                        # print("linear", float_input.shape)
                        float_ratio = floatmodel_lr(float_input)
                    else:
                        # print("nn", float_input.shape)
                        float_ratio = floatmodel_nn(float_input)
                    
                    if last10days_decisions[j] == 0:
                        # 不能买入涨停股票
                        if last10days_tensor[:,9][j] >= 0.099:
                            holds.append(0)
                            continue
                        # 按照开盘价买入1手
                        holds.append(1)
                        last10days_return -= last10days_tensor[:,9][j] * 100 * float_ratio
                        last10days_invest += last10days_tensor[:,9][j] * 100 * float_ratio
                    elif last10days_decisions[j] == 1:
                        holds.append(0)
                    else:
                        if sum(holds) <= 0:
                            holds.append(0)
                            continue
                        # 不能卖出
                        if last10days_tensor[:,8][j] <= -0.099:
                            holds.append(0)
                            continue
                        # 按照收盘价卖出1手
                        holds.append(-1)
                        last10days_return += last10days_tensor[:,9][j] * 100 * float_ratio

                # sell all the stocks at the end of 10 days,
                if sum(holds) > 0:
                    # 跌停也按照0.9的收盘价次日平仓
                    if last10days_tensor[:,8][9] <= -0.099:
                        last10days_return += 0.9 * sum(holds) * last10days_tensor[:,8][9] * 100 * float_ratio
                    # 非跌停按照收盘价平仓
                    else:
                        last10days_return += sum(holds) * last10days_tensor[:,8][9] * 100 * float_ratio
                # calculate the return ratio,
                if last10days_invest <= 0:
                    last10days_roi = 0.0
                else:
                    last10days_roi = (last10days_return / last10days_invest - 1).item()
                
                # get the metric (roi) by apply the subject to the next 10 days, 
                # decision: 0-买入，1-持有，2-卖出, holds: 0: +1, 1: +0; 2: -1, 
                holds = []
                next10days_return = 0.0
                next10days_invest = 0.0
                for j in range(0, 10):
                    # get the float model input, and use the subject to get the float ratio, 
                    float_input = torch.tensor(subject_vector, dtype=torch.float32)
                    if subject_label[index] == 0:
                        float_ratio = floatmodel_lr(float_input)
                    else:
                        float_ratio = floatmodel_nn(float_input)
                    if next10days_decisions[j] == 0:
                        # 不能买入涨停股票
                        if next10days_tensor[:,9][j] >= 0.099:
                            holds.append(0)
                            continue
                        # 按照开盘价买入1手
                        holds.append(1)
                        next10days_return -= next10days_tensor[:,9][j] * 100 * float_ratio
                        next10days_invest += next10days_tensor[:,9][j] * 100 * float_ratio
                    elif next10days_decisions[j] == 1:
                        holds.append(0)
                    else:
                        if sum(holds) <= 0:
                            holds.append(0)
                            continue
                        # 不能卖出跌停股票
                        if next10days_tensor[:,8][j] <= -0.099:
                            holds.append(0)
                            continue
                        # 按照收盘价卖出1手
                        holds.append(-1)
                        next10days_return += next10days_tensor[:,9][j] * 100 * float_ratio

                # sell all the stocks at the end of 10 days, 
                if sum(holds) > 0:
                    # 跌停也按照0.9的收盘价次日平仓
                    if next10days_tensor[:,8][9] <= -0.099:
                        next10days_return += 0.9 * sum(holds) * next10days_tensor[:,8][9] * 100 * float_ratio
                    # 非跌停按照收盘价平仓
                    else:
                        next10days_return += sum(holds) * next10days_tensor[:,8][9] * 100 * float_ratio
                # calculate the return ratio, 
                if next10days_invest <= 0:
                    next10days_roi = 0.0
                else:
                    next10days_roi = (next10days_return / next10days_invest - 1).item()
                # save the (subject, condition, metric, proxy) into the learning space,
                te_subject_list.append(subject)
                te_subject_vector_list.append(subject_vector)
                te_condition_list.append(last10days_tensor.reshape(-1).tolist())
                te_metric_list.append(next10days_roi)
                # print("next10days_roi:", next10days_roi)
                # input()
                te_metric_proxy_list.append(last10days_roi)
                # baseline errors on test data, 
                errors_roi_last10days_fusion_list.append(next10days_roi - last10days_roi)
                if subject_label[index] == 0:
                    te_subject_lr_list.append(subject)
                    te_subject_vector_lr_list.append(subject_vector)
                    te_condition_lr_list.append(last10days_tensor.reshape(-1).tolist())
                    te_metric_lr_list.append(next10days_roi)
                    te_metric_lr_proxy_list.append(last10days_roi)
                    errors_roi_last10days_lr_list.append(next10days_roi - last10days_roi)
                else:
                    te_subject_nn_list.append(subject)
                    te_subject_vector_nn_list.append(subject_vector)
                    te_condition_nn_list.append(last10days_tensor.reshape(-1).tolist())
                    te_metric_nn_list.append(next10days_roi)
                    te_metric_nn_proxy_list.append(last10days_roi)
                    errors_roi_last10days_nn_list.append(next10days_roi - last10days_roi)
                # ---------------------------------------------------------------------------------
                # release the memory,148+79=227, 400 subject, 1000 stocks, 41-61 days,
                # del subject
                # del subject_vector # should not delete the subject vector, because it is used in the float model,
                del next10days_tensor
                del last10days_decisions
        # # release the memory,
        # del subject
        # del subject_vector
        # del next10days_tensor
        # del last10days_decisions
        # del next10days_decisions
        # ---------------------------------------------------------------------------------
    errors['roi_last10days_fusion'].append(errors_roi_last10days_fusion_list)
    errors['roi_last10days_lr'].append(errors_roi_last10days_lr_list)
    errors['roi_last10days_nn'].append(errors_roi_last10days_nn_list)
    # ---------------------------------------------------------------------------------------------------
    # ---------------------------------------------------------------------------------
    tr_subject_list = []
    tr_subject_lr_list = []
    tr_subject_nn_list = []
    tr_subject_vector_list = []
    tr_subject_vector_lr_list = []
    tr_subject_vector_nn_list = []
    tr_condition_list = []
    tr_condition_lr_list = []
    tr_condition_nn_list = []
    tr_metric_list = []
    tr_metric_lr_list = []
    tr_metric_nn_list = []
    tr_metric_proxy_list = []
    tr_metric_lr_proxy_list = []
    tr_metric_nn_proxy_list = []
    for index in range(n_subject_tr): # every trade strategy, 1600 subjects, on train, 
        print(f"train exp: {i_exp}, subject: {index}")
        for day_id in range(10, n_days_train): # every day, 81 days for train, 
            for stock_id in range(n_stock): # every stocks, 3214 stocks, 
                # get the subject, 
                subject = subject_list[index]
                subject_vector = subject_vector_list[index]
                last10days_start_index = stock_id * 89 + day_id - 10
                last10days_end_index = stock_id * 89 + day_id
                next10days_start_index = stock_id * 89 + day_id
                next10days_end_index = stock_id * 89 + day_id + 10
                # get the decision of the subject for the last 10 days, 
                last10days_tensor = torch.tensor(norm_df.iloc[last10days_start_index:last10days_end_index].values, dtype=torch.float32)
                last10days_decisions = subject(last10days_tensor)
                # get the decision of the subject for the next 10 days, 
                next10days_tensor = torch.tensor(norm_df.iloc[next10days_start_index:next10days_end_index].values, dtype=torch.float32)
                next10days_decisions = subject(next10days_tensor)

                # get the reference metric (ROI) by apply the subject to the last 10 days, 
                # decision: 0-买入，1-持有，2-卖出, holds: 0: +1, 1: +0; 2: -1, 
                holds = []
                last10days_return = 0.0
                last10days_invest = 0.0
                for j in range(0, 10):
                    if last10days_decisions[j] == 0: # 买入
                        # 不能买入涨停股票
                        if last10days_tensor[:,9][j] >= 0.099:
                            holds.append(0)
                            continue
                        # 按照开盘价买入1手
                        holds.append(1) # 仓位 +1
                        last10days_return -= last10days_tensor[:,9][j] * 100 # * float_ratio
                        last10days_invest += last10days_tensor[:,9][j] * 100 # * float_ratio
                    elif last10days_decisions[j] == 1: # 持有
                        holds.append(0) # 仓位 +0
                    else: # 卖出
                        if sum(holds) <= 0: # 空仓没得卖
                            holds.append(0) # 仓位 +0
                            continue
                        # 不能卖出跌停股票
                        if last10days_tensor[:,8][j] <= -0.099:
                            holds.append(0) # 仓位 +0
                            continue
                        # 按照收盘价卖出1手
                        holds.append(-1) # 仓位 -1
                        last10days_return += last10days_tensor[:,9][j] * 100

                # sell all the stocks at the end of 10 days, 
                if sum(holds) > 0: # 清仓大甩卖
                    # 跌停也按照0.9的收盘价次日平仓
                    if last10days_tensor[:,8][9] <= -0.099:
                        last10days_return += 0.9 * sum(holds) * last10days_tensor[:,8][9] * 100
                    # 非跌停按照收盘价平仓
                    else:
                        last10days_return += sum(holds) * last10days_tensor[:,8][9] * 100
                # calculate the return ratio, 
                if last10days_invest <= 0:
                    last10days_roi = 0.0
                else:
                    last10days_roi = (last10days_return / last10days_invest - 1).item()

                # get the metric (roi) by apply the subject to the next 10 days, 
                # decision: 0-买入，1-持有，2-卖出, holds: 0: +1, 1: +0; 2: -1, 
                holds = []
                next10days_return = 0.0
                next10days_invest = 0.0
                for j in range(0, 10):
                    # get the float model input, and use the subject to get the float ratio, 
                    float_input = torch.tensor(subject_vector, dtype=torch.float32)
                    if subject_label[index] == 0:
                        # print("linear", float_input.shape)
                        float_ratio = floatmodel_lr(float_input)
                    else:
                        # print("nn", float_input.shape)
                        float_ratio = floatmodel_nn(float_input)
                    if next10days_decisions[j] == 0:
                        # 不能买入涨停股票
                        if next10days_tensor[:,9][j] >= 0.099:
                            holds.append(0)
                            continue
                        # 按照开盘价买入1手
                        holds.append(1)
                        next10days_return -= next10days_tensor[:,9][j] * 100 * float_ratio
                        next10days_invest += next10days_tensor[:,9][j] * 100 * float_ratio
                    elif next10days_decisions[j] == 1:
                        holds.append(0)
                    else:
                        if sum(holds) <= 0:
                            holds.append(0)
                            continue
                        # 不能卖出跌停股票
                        if next10days_tensor[:,8][j] <= -0.099:
                            holds.append(0)
                            continue
                        # 按照收盘价卖出1手
                        holds.append(-1)
                        next10days_return += next10days_tensor[:,9][j] * 100 * float_ratio

                # sell all the stocks at the end of 10 days, 
                if sum(holds) > 0:
                    # 跌停也按照0.9的收盘价次日平仓
                    if next10days_tensor[:,8][9] <= -0.099:
                        next10days_return += 0.9 * sum(holds) * next10days_tensor[:,8][9] * 100 * float_ratio
                    # 非跌停按照收盘价平仓
                    else:
                        next10days_return += sum(holds) * next10days_tensor[:,8][9] * 100 * float_ratio
                # calculate the return ratio, 
                if next10days_invest <= 0:
                    next10days_roi = 0.0
                else:
                    next10days_roi = (next10days_return / next10days_invest - 1).item()
                # ---------------------------------------------------------------------------------
                # add subject, condition, proxy, metric into the learning space,
                tr_subject_list.append(subject)
                tr_subject_vector_list.append(subject_vector)
                tr_condition_list.append(last10days_tensor.reshape(-1).tolist())
                tr_metric_list.append(next10days_roi)
                # print("next10days_roi:", next10days_roi)
                tr_metric_proxy_list.append(last10days_roi)
                if subject_label[index] == 0:
                    tr_subject_lr_list.append(subject)
                    tr_subject_vector_lr_list.append(subject_vector)
                    tr_condition_lr_list.append(last10days_tensor.reshape(-1).tolist())
                    tr_metric_lr_list.append(next10days_roi)
                    tr_metric_lr_proxy_list.append(last10days_roi)
                else:
                    tr_subject_nn_list.append(subject)
                    tr_subject_vector_nn_list.append(subject_vector)
                    tr_condition_nn_list.append(last10days_tensor.reshape(-1).tolist())
                    tr_metric_nn_list.append(next10days_roi)
                    tr_metric_nn_proxy_list.append(last10days_roi)
                # --------------------------------------------------------------------------------
    # -----------------------sampling from the metric space-------------------------------
    # ---------------------------------------------------------------------
    # save 
    # check the data,
    print("tr_subject_list:", len(tr_subject_list))
    print("tr_condition_list:", len(tr_condition_list))
    print("tr_metric_list:", len(tr_metric_list))
    print("tr_metric_proxy_list:", len(tr_metric_proxy_list))
    print("te_subject_list:", len(te_subject_list))
    print("te_condition_list:", len(te_condition_list))
    print("te_metric_list:", len(te_metric_list))
    print("te_metric_proxy_list:", len(te_metric_proxy_list))
    # ---------------------------------------------------------------------

    # ---------------------------evaluation task-----------------------------
    # 在训练集中subject,condition,metric,proxy均和测试集不同
    # 训练模型时直接使用train上的数据，测试时用test上的数据，不需要划分
    s_lr_tr = tr_subject_vector_lr_list
    s_lr_te = te_subject_vector_lr_list
    s_nn_tr = tr_subject_vector_nn_list
    s_nn_te = te_subject_vector_nn_list
    # to numpy and show shape, 
    s_lr_tr = np.array(s_lr_tr)
    s_lr_te = np.array(s_lr_te)
    s_nn_tr = np.array(s_nn_tr)
    s_nn_te = np.array(s_nn_te)
    # print("subject shape:", s_lr_tr.shape, s_lr_te.shape, s_nn_tr.shape, s_nn_te.shape)
    m_lr_tr = np.array(tr_metric_lr_list).reshape(-1, 1)
    m_lr_te = np.array(te_metric_lr_list).reshape(-1, 1)
    m_nn_tr = np.array(tr_metric_nn_list).reshape(-1, 1)
    m_nn_te = np.array(te_metric_nn_list).reshape(-1, 1)
    m_lr_va_te = np.array(te_metric_lr_proxy_list).reshape(-1, 1)
    m_nn_va_te = np.array(te_metric_nn_proxy_list).reshape(-1, 1)
    m_lr_va_tr = np.array(tr_metric_lr_proxy_list).reshape(-1, 1)
    m_nn_va_tr = np.array(tr_metric_nn_proxy_list).reshape(-1, 1)
    # condition,
    # print("condition shape:", tr_condition_lr_list, len(te_condition_list))
    c_lr_tr = np.array(tr_condition_lr_list)
    c_lr_te = np.array(te_condition_lr_list)
    c_nn_tr = np.array(tr_condition_nn_list)
    c_nn_te = np.array(te_condition_nn_list)
    print("c_lr_tr, c_lr_te, c_nn_tr, c_nn_te shape:", c_lr_tr.shape, c_lr_te.shape, c_nn_tr.shape, c_nn_te.shape)
    print("m_lr_tr, m_lr_te, m_nn_tr, m_nn_te shape:", m_lr_tr.shape, m_lr_te.shape, m_nn_tr.shape, m_nn_te.shape)
    print("m_lr_va_tr, m_lr_va_te, m_lr_va_te, m_nn_va_te shape:", m_lr_va_tr.shape, m_lr_va_te.shape, m_nn_va_tr.shape, m_nn_va_te.shape)
    print("s_lr_tr, s_lr_te, s_nn_tr, s_nn_te shape:", s_lr_tr.shape, s_lr_te.shape, s_nn_tr.shape, s_nn_te.shape)
    # scp
    scp_lr_tr = np.concatenate([s_lr_tr, m_lr_va_tr, c_lr_tr], axis=1)
    scp_lr_te = np.concatenate([s_lr_te, m_lr_va_te, c_lr_te], axis=1)
    scp_nn_tr = np.concatenate([s_nn_tr, m_nn_va_tr, c_nn_tr], axis=1)
    scp_nn_te = np.concatenate([s_nn_te, m_nn_va_te, c_nn_te], axis=1)
    # sc
    sc_lr_tr = np.concatenate([s_lr_tr, c_lr_tr], axis=1)
    sc_lr_te = np.concatenate([s_lr_te, c_lr_te], axis=1)
    sc_nn_tr = np.concatenate([s_nn_tr, c_nn_tr], axis=1)
    sc_nn_te = np.concatenate([s_nn_te, c_nn_te], axis=1)
    # cp
    cp_lr_tr = np.concatenate([c_lr_tr, m_lr_va_tr], axis=1)
    cp_lr_te = np.concatenate([c_lr_te, m_lr_va_te], axis=1)
    cp_nn_tr = np.concatenate([c_nn_tr, m_nn_va_tr], axis=1)
    cp_nn_te = np.concatenate([c_nn_te, m_nn_va_te], axis=1)
    # sp
    sp_lr_te = np.concatenate([s_lr_te, m_lr_va_te], axis=1)
    sp_nn_te = np.concatenate([s_nn_te, m_nn_va_te], axis=1)
    sp_lr_tr = np.concatenate([s_lr_tr, m_lr_va_tr], axis=1)
    sp_nn_tr = np.concatenate([s_nn_tr, m_nn_va_tr], axis=1)
    # ---------------------------------------------------------------------
    
    # ----------------------- em -----------------------
    for model_name in model_names:
        print(f"model_name: {model_name}")
        if model_name == 'linear':
            from sklearn.linear_model import LinearRegression
            # s, c, p
            lrmodel = LinearRegression()
            nnmodel = LinearRegression()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = LinearRegression()
            nnmodel_s = LinearRegression()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            lrmodel_p = LinearRegression()
            nnmodel_p = LinearRegression()
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            lrmodel_c = LinearRegression()
            nnmodel_c = LinearRegression()
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc 
            lrmodel_sc = LinearRegression()
            nnmodel_sc = LinearRegression()
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp
            lrmodel_sp = LinearRegression()
            nnmodel_sp = LinearRegression()
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp
            lrmodel_cp = LinearRegression()
            nnmodel_cp = LinearRegression()
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)

            lr_error = m_lr_te - lrmodel.predict(scp_lr_te)
            nn_error = m_nn_te - nnmodel.predict(scp_nn_te)
            # s
            lr_error_subject = m_lr_te - lrmodel_s.predict(s_lr_te)
            nn_error_subject = m_nn_te - nnmodel_s.predict(s_nn_te)
            # p
            lr_error_proxy = m_lr_te - lrmodel_p.predict(m_lr_va_te)
            nn_error_proxy = m_nn_te - nnmodel_p.predict(m_nn_va_te)
            # c
            lr_error_c = m_lr_te - lrmodel_c.predict(c_lr_te)
            nn_error_c = m_nn_te - nnmodel_c.predict(c_nn_te)
            # sc
            lr_error_sc = m_lr_te - lrmodel_sc.predict(sc_lr_te)
            nn_error_sc = m_nn_te - nnmodel_sc.predict(sc_nn_te)
            # sp
            lr_error_sp = m_lr_te - lrmodel_sp.predict(sp_lr_te)
            nn_error_sp = m_nn_te - nnmodel_sp.predict(sp_nn_te)
            # cp
            lr_error_cp = m_lr_te - lrmodel_cp.predict(cp_lr_te)
            nn_error_cp = m_nn_te - nnmodel_cp.predict(cp_nn_te)

        elif model_name == 'mlp':
            from sklearn.neural_network import MLPRegressor
            # s, c, p
            # use GridSearch to find the best parameters for MLPRegressor
            from sklearn.model_selection import GridSearchCV
            params = {
                'hidden_layer_sizes': [(100,), (50, 50), (100, 50), (50, 100)],
                # 'activation': ['relu', 'tanh', 'logistic'],
                # 'solver': ['adam', 'sgd', 'lbfgs'],
                'alpha': [0.0001, 0.001, 0.01],
                # 'learning_rate': ['constant', 'adaptive'],
                'max_iter': [1000, 2000, 3000],
                'random_state': [42]
            }
            lrmodel = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel = MLPRegressor()
            # nnmodel = MLPRegressor()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel_s = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel_s = MLPRegressor()
            # nnmodel_s = MLPRegressor()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            lrmodel_p = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel_p = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel_p = MLPRegressor()
            # nnmodel_p = MLPRegressor()
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            lrmodel_c = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel_c = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel_c = MLPRegressor()
            # nnmodel_c = MLPRegressor()
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc
            lrmodel_sc = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel_sc = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel_sc = MLPRegressor()
            # nnmodel_sc = MLPRegressor()
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp
            lrmodel_sp = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel_sp = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel_sp = MLPRegressor()
            # nnmodel_sp = MLPRegressor()
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp
            lrmodel_cp = GridSearchCV(MLPRegressor(), params, cv=3)
            nnmodel_cp = GridSearchCV(MLPRegressor(), params, cv=3)
            # lrmodel_cp = MLPRegressor()
            # nnmodel_cp = MLPRegressor()
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)

        elif model_name == 'svm':
            from sklearn.svm import SVR
            # s, c, p
            lrmodel = SVR()
            nnmodel = SVR()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = SVR()
            nnmodel_s = SVR()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            lrmodel_p = SVR()
            nnmodel_p = SVR()
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            lrmodel_c = SVR()
            nnmodel_c = SVR()
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc
            lrmodel_sc = SVR()
            nnmodel_sc = SVR()
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp
            lrmodel_sp = SVR()
            nnmodel_sp = SVR()
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp
            lrmodel_cp = SVR()
            nnmodel_cp = SVR()
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)
        elif model_name == 'rf': 
            from sklearn.ensemble import RandomForestRegressor
            # s, c, p
            # use GridSearch to find the best parameters for RandomForestRegressor
            from sklearn.model_selection import GridSearchCV
            params = {
                'n_estimators': [100, 200, 300],
                'max_depth': [10, 20, 30],
                'min_samples_split': [2, 5, 10],
                'min_samples_leaf': [1, 2, 4],
                'max_features': ['auto', 'sqrt'],
                'bootstrap': [True, False]
            }
            lrmodel = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel = GridSearchCV(RandomForestRegressor(), params, cv=3)
            # lrmodel = RandomForestRegressor()
            # nnmodel = RandomForestRegressor()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel_s = GridSearchCV(RandomForestRegressor(), params, cv=3)
            # lrmodel_s = RandomForestRegressor()
            # nnmodel_s = RandomForestRegressor()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            # lrmodel_p = RandomForestRegressor()
            # nnmodel_p = RandomForestRegressor()
            lrmodel_p = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel_p = GridSearchCV(RandomForestRegressor(), params, cv=3)
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            # lrmodel_c = RandomForestRegressor()
            # nnmodel_c = RandomForestRegressor()
            lrmodel_c = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel_c = GridSearchCV(RandomForestRegressor(), params, cv=3)
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc
            # lrmodel_sc = RandomForestRegressor()
            # nnmodel_sc = RandomForestRegressor()
            lrmodel_sc = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel_sc = GridSearchCV(RandomForestRegressor(), params, cv=3)
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp, 
            # lrmodel_sp = RandomForestRegressor()
            # nnmodel_sp = RandomForestRegressor()
            lrmodel_sp = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel_sp = GridSearchCV(RandomForestRegressor(), params, cv=3)
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp, 
            # lrmodel_cp = RandomForestRegressor()
            # nnmodel_cp = RandomForestRegressor()
            lrmodel_cp = GridSearchCV(RandomForestRegressor(), params, cv=3)
            nnmodel_cp = GridSearchCV(RandomForestRegressor(), params, cv=3)
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)
        elif model_name == 'lgbm':
            import lightgbm as lgb
            # s, c, p
            # use GridSearch to find the best parameters for LGBMRegressor
            from sklearn.model_selection import GridSearchCV
            params = {
                # 'boosting_type': ['gbdt', 'dart'],
                'num_leaves': [31, 63],
                'max_depth': [-1, 10, 20],
                'learning_rate': [0.01, 0.1, 0.2],
                'n_estimators': [100, 200],
                # 'subsample_for_bin': [20000, 50000],
            }
            lrmodel = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel = lgb.LGBMRegressor()
            # nnmodel = lgb.LGBMRegressor()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_s = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_s = lgb.LGBMRegressor()
            # nnmodel_s = lgb.LGBMRegressor()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            lrmodel_p = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_p = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_p = lgb.LGBMRegressor()
            # nnmodel_p = lgb.LGBMRegressor()
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            lrmodel_c = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_c = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_c = lgb.LGBMRegressor()
            # nnmodel_c = lgb.LGBMRegressor()
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc
            lrmodel_sc = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_sc = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_sc = lgb.LGBMRegressor()
            # nnmodel_sc = lgb.LGBMRegressor()
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp
            lrmodel_sp = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_sp = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_sp = lgb.LGBMRegressor()
            # nnmodel_sp = lgb.LGBMRegressor()
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp
            lrmodel_cp = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_cp = GridSearchCV(lgb.LGBMRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_cp = lgb.LGBMRegressor()
            # nnmodel_cp = lgb.LGBMRegressor()
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)

        elif model_name == 'xgb':
            import xgboost as xgb
            # s, c, p
            # use GridSearch to find the best parameters for XGBRegressor
            from sklearn.model_selection import GridSearchCV
            params = {
                'n_estimators': [100, 200],
                'max_depth': [3, 5, 7],
                'learning_rate': [0.01, 0.1],
                'subsample': [0.8, 1.0],
                'colsample_bytree': [0.8, 1.0],
            }
            lrmodel = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel = xgb.XGBRegressor()
            # nnmodel = xgb.XGBRegressor()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_s = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_s = xgb.XGBRegressor()
            # nnmodel_s = xgb.XGBRegressor()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            lrmodel_p = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_p = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_p = xgb.XGBRegressor()
            # nnmodel_p = xgb.XGBRegressor()
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            lrmodel_c = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_c = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_c = xgb.XGBRegressor()
            # nnmodel_c = xgb.XGBRegressor()
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc
            lrmodel_sc = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_sc = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_sc = xgb.XGBRegressor()
            # nnmodel_sc = xgb.XGBRegressor()
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp
            lrmodel_sp = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_sp = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_sp = xgb.XGBRegressor()
            # nnmodel_sp = xgb.XGBRegressor()
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp
            lrmodel_cp = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_cp = GridSearchCV(xgb.XGBRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel_cp = xgb.XGBRegressor()
            # nnmodel_cp = xgb.XGBRegressor()
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)

        elif model_name == 'catboost':
            from catboost import CatBoostRegressor
            # use GridSearch to find the best parameters for CatBoostRegressor
            from sklearn.model_selection import GridSearchCV
            params = {
                'iterations': [100, 200],
                'depth': [6, 8],
                'learning_rate': [0.01, 0.1],
                'l2_leaf_reg': [1, 3],
                'border_count': [32, 64],
            }
            # s, c, p
            lrmodel = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            # lrmodel = CatBoostRegressor()
            # nnmodel = CatBoostRegressor()
            lrmodel.fit(scp_lr_tr, m_lr_tr, verbose=0)
            nnmodel.fit(scp_nn_tr, m_nn_tr, verbose=0)
            # s
            # lrmodel_s = CatBoostRegressor()
            # nnmodel_s = CatBoostRegressor()
            lrmodel_s = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_s = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            lrmodel_s.fit(s_lr_tr, m_lr_tr, verbose=0)
            nnmodel_s.fit(s_nn_tr, m_nn_tr, verbose=0)
            # p
            # lrmodel_p = CatBoostRegressor()
            # nnmodel_p = CatBoostRegressor()
            lrmodel_p = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_p = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr, verbose=0)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr, verbose=0)
            # c
            # lrmodel_c = CatBoostRegressor()
            # nnmodel_c = CatBoostRegressor()
            lrmodel_c = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_c = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            lrmodel_c.fit(c_lr_tr, m_lr_tr, verbose=0)
            nnmodel_c.fit(c_nn_tr, m_nn_tr, verbose=0)
            # sc
            # lrmodel_sc = CatBoostRegressor()
            # nnmodel_sc = CatBoostRegressor()
            lrmodel_sc = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_sc = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            lrmodel_sc.fit(sc_lr_te, m_lr_te, verbose=0)
            nnmodel_sc.fit(sc_nn_te, m_nn_te, verbose=0)
            # sp
            # lrmodel_sp = CatBoostRegressor()
            # nnmodel_sp = CatBoostRegressor()
            lrmodel_sp = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_sp = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            lrmodel_sp.fit(sp_lr_te, m_lr_te, verbose=0)
            nnmodel_sp.fit(sp_nn_te, m_nn_te, verbose=0)
            # cp
            # lrmodel_cp = CatBoostRegressor()
            # nnmodel_cp = CatBoostRegressor()
            lrmodel_cp = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            nnmodel_cp = GridSearchCV(CatBoostRegressor(), params, cv=3, n_jobs=-1)
            lrmodel_cp.fit(cp_lr_te, m_lr_te, verbose=0)
            nnmodel_cp.fit(cp_nn_te, m_nn_te, verbose=0)

        elif model_name == 'tabpfn':
            from tabpfn import TabPFNClassifier, TabPFNRegressor
            # s, c, p
            lrmodel = TabPFNRegressor()
            nnmodel = TabPFNRegressor()
            lrmodel.fit(scp_lr_tr, m_lr_tr)
            nnmodel.fit(scp_nn_tr, m_nn_tr)
            # s
            lrmodel_s = TabPFNRegressor()
            nnmodel_s = TabPFNRegressor()
            lrmodel_s.fit(s_lr_tr, m_lr_tr)
            nnmodel_s.fit(s_nn_tr, m_nn_tr)
            # p
            lrmodel_p = TabPFNRegressor()
            nnmodel_p = TabPFNRegressor()
            lrmodel_p.fit(m_lr_va_tr, m_lr_tr)
            nnmodel_p.fit(m_nn_va_tr, m_nn_tr)
            # c
            lrmodel_c = TabPFNRegressor()
            nnmodel_c = TabPFNRegressor()
            lrmodel_c.fit(c_lr_tr, m_lr_tr)
            nnmodel_c.fit(c_nn_tr, m_nn_tr)
            # sc
            lrmodel_sc = TabPFNRegressor()
            nnmodel_sc = TabPFNRegressor()
            lrmodel_sc.fit(sc_lr_te, m_lr_te)
            nnmodel_sc.fit(sc_nn_te, m_nn_te)
            # sp
            lrmodel_sp = TabPFNRegressor()
            nnmodel_sp = TabPFNRegressor()
            lrmodel_sp.fit(sp_lr_te, m_lr_te)
            nnmodel_sp.fit(sp_nn_te, m_nn_te)
            # cp
            lrmodel_cp = TabPFNRegressor()
            nnmodel_cp = TabPFNRegressor()
            lrmodel_cp.fit(cp_lr_te, m_lr_te)
            nnmodel_cp.fit(cp_nn_te, m_nn_te)

        else: 
            raise ValueError("model_name is not supported!")
        
        # shape of the error,
        print("lr_error, nn_error shape:", lr_error.shape, nn_error.shape)
        print("lr_error_subject, nn_error_subject shape:", lr_error_subject.shape, nn_error_subject.shape)
        print("lr_error_proxy, nn_error_proxy shape:", lr_error_proxy.shape, nn_error_proxy.shape)
        # ---------------------------------------------------------------------------------------------------

        # merge the lr error and nn error, 
        error_list = np.concatenate([lr_error, nn_error])
        error_list_subject = np.concatenate([lr_error_subject, nn_error_subject])
        error_list_proxy = np.concatenate([lr_error_proxy, nn_error_proxy])
        # shape, 
        # print("all, subject, proxy shape:", error_list, error_list_subject, error_list_proxy)

        # error, 
        errors[f"{model_name}_fusion"].append(error_list)
        errors[f"{model_name}_lr"].append(lr_error)
        errors[f"{model_name}_nn"].append(nn_error)
        # s error, 
        errors_s[f"{model_name}_fusion"].append(error_list_subject)
        errors_s[f"{model_name}_lr"].append(lr_error_subject)
        errors_s[f"{model_name}_nn"].append(nn_error_subject)
        # p error, 
        errors_p[f"{model_name}_fusion"].append(error_list_proxy)
        errors_p[f"{model_name}_lr"].append(lr_error_proxy)
        errors_p[f"{model_name}_nn"].append(nn_error_proxy)
        # c error,
        errors_c[f"{model_name}_fusion"].append(lr_error_c)
        errors_c[f"{model_name}_lr"].append(nn_error_c)
        errors_c[f"{model_name}_nn"].append(lr_error_c)
        # sc error,
        errors_sc[f"{model_name}_fusion"].append(lr_error_sc)
        errors_sc[f"{model_name}_lr"].append(nn_error_sc)
        errors_sc[f"{model_name}_nn"].append(lr_error_sc)
        # sp error,
        errors_sp[f"{model_name}_fusion"].append(lr_error_sp)
        errors_sp[f"{model_name}_lr"].append(nn_error_sp)
        errors_sp[f"{model_name}_nn"].append(lr_error_sp)
        # cp error,
        errors_cp[f"{model_name}_fusion"].append(lr_error_cp)
        errors_cp[f"{model_name}_lr"].append(nn_error_cp)
        errors_cp[f"{model_name}_nn"].append(lr_error_cp)
        # ---------------------------------------------------------------------------------------------------

        # reshape the error_list to 1-d array, 
        error_list = error_list.reshape(-1)
        error_list = winsorize(error_list)
        lr_error = lr_error.reshape(-1)
        lr_error = winsorize(lr_error)
        nn_error = nn_error.reshape(-1)
        nn_error = winsorize(nn_error)
        # shape, 
        # print("error_list shape:", error_list.shape)

        # ------iid check by central limit theorem-------
        # (1) randomly select half errors, total 30 groups, 
        n_group = 30
        group_means = []
        group_means_lr = []
        group_means_nn = []
        for i in range(n_group):
            # randomly select half errors from error_list, 
            selected_errors = np.random.choice(error_list, int(len(error_list)/2))
            selected_errors_lr = np.random.choice(lr_error, int(len(lr_error)/2))
            selected_errors_nn = np.random.choice(nn_error, int(len(nn_error)/2))
            # calculate the mean of the error, 
            group_means.append(np.mean(selected_errors))
            group_means_lr.append(np.mean(selected_errors_lr))
            group_means_nn.append(np.mean(selected_errors_nn))

        # (2) mean of each group, should be a normal distribution, 
        # use kurtosistest test to check the normal distribution, 
        from scipy.stats import normaltest
        stat, p = normaltest(group_means)
        stat_lr, p_lr = normaltest(group_means_lr)
        stat_nn, p_nn = normaltest(group_means_nn)
        # model_name = "linear", test_name = "iid", target_name = "rocauc", subject_name = "fusion"
        p_values[f"{model_name}_iid_fusion"].append(p)
        p_values[f"{model_name}_iid_lr"].append(p_lr)
        p_values[f"{model_name}_iid_nn"].append(p_nn)

        # ------id check by ks test-------
        n_sample_per_group = 30
        n_group = len(error_list) // n_sample_per_group
        n_group_lr = len(lr_error) // n_sample_per_group
        n_group_nn = len(nn_error) // n_sample_per_group
        # randomly split the error_list into n_group groups, 
        group_errors = np.array_split(error_list, n_group)
        group_errors_lr = np.array_split(lr_error, n_group_lr)
        group_errors_nn = np.array_split(nn_error, n_group_nn)

        # transformation
        # use ks test pair-wise to check the whether n groups are from the same distribution, 
        from scipy.stats import kruskal
        # print("group_errors:", len(group_errors), group_errors)
        stat, p = kruskal(*group_errors)
        stat_lr, p_lr = kruskal(*group_errors_lr)
        stat_nn, p_nn = kruskal(*group_errors_nn)
        # model_name = "linear", test_name = "id", target_name = "rocauc", subject_name = "fusion"
        p_values[f"{model_name}_id_fusion"].append(p)
        p_values[f"{model_name}_id_lr"].append(p_lr)
        p_values[f"{model_name}_id_nn"].append(p_nn)
        
        # ------bias check by something-------
        # null hypothesis: check the bias of the error is 0,
        from scipy.stats import ttest_1samp
        stat, p = ttest_1samp(error_list, 0)
        stat_lr, p_lr = ttest_1samp(lr_error, 0)
        stat_nn, p_nn = ttest_1samp(nn_error, 0)
        # model_name = "linear", test_name = "unbias", target_name = "rocauc", subject_name = "fusion"
        p_values[f"{model_name}_bias_fusion"].append(p)
        p_values[f"{model_name}_bias_lr"].append(p_lr)
        p_values[f"{model_name}_bias_nn"].append(p_nn)
        # ---------------------------------------------------------------------------------------------------
    # release the memory,
    del tr_subject_list
    del tr_subject_lr_list
    del tr_subject_nn_list
    del tr_subject_vector_list
    del tr_subject_vector_lr_list
    del tr_subject_vector_nn_list
    del tr_condition_list
    del tr_condition_lr_list
    del tr_condition_nn_list
    del tr_metric_list
    del tr_metric_lr_list
    del tr_metric_nn_list
    del tr_metric_proxy_list
    del tr_metric_lr_proxy_list
    del tr_metric_nn_proxy_list
    del te_subject_list
    del te_subject_lr_list
    del te_subject_nn_list
    del te_subject_vector_list
    del te_subject_vector_lr_list
    del te_subject_vector_nn_list
    del te_condition_list
    del te_condition_lr_list
    del te_condition_nn_list
    del te_metric_list
    del te_metric_lr_list
    del te_metric_nn_list
    del te_metric_proxy_list
    del te_metric_lr_proxy_list
    del te_metric_nn_proxy_list
    # ---------------------------------------------------------------------------------------------------
print("complete evaluation!")
# ---------------------------evaluation task-----------------------------
# save the p_values, errors, errors_subject, errors_proxy, (dictories file)
import pickle
with open('./expdata/' + dataset_name + '/p_values.pkl', 'wb') as f:
    pickle.dump(p_values, f)
with open('./expdata/' + dataset_name + '/errors.pkl', 'wb') as f:
    pickle.dump(errors, f)
with open('./expdata/' + dataset_name + '/errors_s.pkl', 'wb') as f:
    pickle.dump(errors_s, f)
with open('./expdata/' + dataset_name + '/errors_p.pkl', 'wb') as f:
    pickle.dump(errors_p, f)
with open('./expdata/' + dataset_name + '/errors_c.pkl', 'wb') as f:
    pickle.dump(errors_c, f)
with open('./expdata/' + dataset_name + '/errors_sc.pkl', 'wb') as f:
    pickle.dump(errors_sc, f)
with open('./expdata/' + dataset_name + '/errors_sp.pkl', 'wb') as f:
    pickle.dump(errors_sp, f)
with open('./expdata/' + dataset_name + '/errors_cp.pkl', 'wb') as f:
    pickle.dump(errors_cp, f)
print("complete write!")
# ---------------------------evaluation task-----------------------------
# load the p_values, errors, errors_subject, errors_proxy, (dictories file)
import pickle
with open('./expdata/' + dataset_name + '/p_values.pkl', 'rb') as f:
    p_values = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors.pkl', 'rb') as f:
    errors = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors_s.pkl', 'rb') as f:
    errors_subject = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors_p.pkl', 'rb') as f:
    errors_proxy = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors_c.pkl', 'rb') as f:
    errors_c = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors_sc.pkl', 'rb') as f:
    errors_sc = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors_sp.pkl', 'rb') as f:
    errors_sp = pickle.load(f)
with open('./expdata/' + dataset_name + '/errors_cp.pkl', 'rb') as f:
    errors_cp = pickle.load(f)
print("complete load!")
# ---------------------------evaluation task-----------------------------