
import os
os.system("pip install --upgrade scikit-learn")

import torch
from torch import nn
import argparse
from dnamite.models import DNAMiteRegressor
import torch
import time
import numpy as np
import pandas as pd

import sklearn

def main():
    
    parser = argparse.ArgumentParser(description="Train a model")
    parser.add_argument('--data_name', default='only_main_data', type=str, help='type of the data to use')
    args = parser.parse_args()

    path = '../../Dataset/Numerical-Studies/'
    dataset = torch.load(path+args.data_name+'.pt', weights_only = True)

    length = dataset['X_train'].size()[0]
    mse_list = np.zeros(length)
    start_time = time.time()
    
    for i in range(length):
        X_train = pd.DataFrame(dataset['X_train'][i])
        y_train = np.asarray(dataset['y_train'][i]).reshape(-1)
    
        model = DNAMiteRegressor()
        model.fit(X_train, y_train)
    
        pred = model.predict(pd.DataFrame(dataset['X_test'][i]))
        mse_list[i] = np.mean((pred - np.asarray(dataset['y_test'][i]).reshape(-1))**2)

    end_time = time.time()
    elapsed_time = end_time - start_time
    print(mse_list)
    print(f"Program executed in {elapsed_time:.4f} seconds")
    print(f"Mean of MSE {np.mean(mse_list)}")
    print(f"Std of MSE {np.std(mse_list)}")
    
if __name__ == "__main__":
    main()


