
# # Comparsion models for competing risks
# In this script we train the different models for competing risks
import sys
from experiment import *
from generate import *

# Open dataset
random_seed = 42
mode = sys.argv[1]

try:
    if int(mode) == 0:
        mode = 'rand' 
    elif int(mode) == 1:
        mode = 'obs'
except: pass

print("Script running experiments on generated data with seed =", random_seed)
for size in [300, 30000]:
    x, a, t, e, _ = generate(random_seed, size = size, mode = mode) 

    # Normalise data
    x, t, e, a = StandardScaler().fit_transform(x.values).astype(float),\
                t.values.astype(float), e.values.astype(int), a.values.astype(int)

    # Hyperparameters and evaluations
    max_epochs = 1000
    grid_search = 100
    layers = [[50] * (j + 1) for j in range(3)]

    # Clustering
    param_grid = {
        'n_clusters': [3]
    }
    KmeansExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_kmeans'.format(mode, random_seed, size)).train(x, t, e, a)

    # VirtualTwins
    param_grid = {
        'n_clusters': [3],
        'max_depth': [3, 5, None],
        'min_samples_split': [6, 12, 24],
    }
    VirtualTwinsExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_twins'.format(mode, random_seed, size)).train(x, t, e, a)

    # NTC Competing risk
    param_grid = {
        'epochs': [max_epochs],
        'learning_rate' : [1e-3, 1e-4],
        'batch': [100, 250],

        'layers_surv': layers,
        'representation': [10, 25, 50],
        'k': [3],
        'layers' : layers,
        'act': ['Tanh'],
        'gamma': [0],
        'correct' : [True]
    }
    NTCExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_ntc'.format(mode, random_seed, size)).train(x, t, e, a)

    param_grid['correct'] = [False]
    NTCExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_ntc+uncorrect'.format(mode, random_seed, size)).train(x, t, e, a)


    # CMHE
    param_grid = {
        'epochs': [max_epochs],
        'learning_rate' : [1e-3, 1e-4],
        'batch': [100, 250],

        'layers': layers,
        'k': [1],
        'g': [3],
    }
    CMHEExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_cmhe+g'.format(mode, random_seed, size)).train(x, t, e, a)

    param_grid = {
        'epochs': [max_epochs],
        'learning_rate' : [1e-3, 1e-4],
        'batch': [100, 250],

        'layers': layers,
        'k': [3],
        'g': [1],
    }
    CMHEExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_cmhe+k'.format(mode, random_seed, size)).train(x, t, e, a)

    param_grid = {
        'epochs': [max_epochs],
        'learning_rate' : [1e-3, 1e-4],
        'batch': [100, 250],

        'layers': layers,
        'k': [3 // 2 + 1],
        'g': [3 // 2 + 1],
    }
    CMHEExperiment.create(param_grid, n_iter = grid_search, path = 'Results_ntc/generatesize_{}={}+{}_cmhe+gk'.format(mode, random_seed, size)).train(x, t, e, a)