import sys
sys.path.append("../")
import os
os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"

import torch
import torch.nn as nn
import random
import numpy as np

from HyperSINDy import Net
from baseline import Trainer
from library_utils import Library
from Datasets import SyntheticDataset
from other import init_weights, set_random_seed

"""
Train HyperSINDy on lorenz
"""

import argparse
def parse_args():
    parser = argparse.ArgumentParser(description="Template")
    parser.add_argument('-S1', '--s1', default=0, type=int, help="Exp set 1.")
    parser.add_argument('-S2', '--s2', default=0, type=int, help="Exp set 2.")
    parser.add_argument('-S3', '--s3', default=0, type=int, help="Exp set 3.")
    parser.add_argument('-S4', '--s4', default=0, type=int, help="Exp set 1.")
    parser.add_argument('-S5', '--s5', default=0, type=int, help="Exp set 2.")
    parser.add_argument('-S6', '--s6', default=0, type=int, help="Exp set 3.")
    parser.add_argument('-S7', '--s7', default=0, type=int, help="Exp set 1.")
    parser.add_argument('-S8', '--s8', default=0, type=int, help="Exp set 2.")
    parser.add_argument('-S9', '--s9', default=0, type=int, help="Exp set 3.")
    parser.add_argument('-S10', '--s10', default=0, type=int, help="Exp set 3.")
    parser.add_argument('-D1', '--d1', default=1, type=int, help="Device for exp 1.")
    parser.add_argument('-D2', '--d2', default=2, type=int, help="Device for exp 2.")
    parser.add_argument('-D3', '--d3', default=3, type=int, help="Device for exp 3.")
    return parser.parse_args()

def pipeline(library, trainset, epochs, lr,
             lmda_init, lmda_max, lmda_max_epoch, lmda_spike, lmda_spike_epoch,
             beta_init, beta_max, beta_max_epoch, beta_spike, beta_spike_epoch,
             adam_reg, gamma_factor, batch_size,
             thresh_interval, eval_interval, hard_thresh,
             run_name, runs, noise_dim, hidden_dim, stat_size, device,
             num_hidden, batch_norm):
    print(run_name)

    torch.cuda.set_device(device=device)
    device = torch.cuda.current_device()
    net = Net(library, noise_dim=noise_dim, hidden_dim=hidden_dim,
              statistic_batch_size=stat_size, num_hidden=num_hidden,
              batch_norm=batch_norm).to(device)
    net.apply(init_weights)

    trainer = Trainer(net, library, runs + run_name, runs + "cp_" + run_name + ".pt",
                      beta_init=beta_init, beta_max=beta_max, beta_max_epoch=beta_max_epoch, 
                      beta_spike=beta_spike, beta_spike_epoch=beta_spike_epoch,
                      lmda_init=lmda_init, lmda_max=lmda_max, lmda_max_epoch=lmda_max_epoch,
                      lmda_spike=lmda_spike, lmda_spike_epoch=lmda_spike_epoch,
                      learning_rate=lr, adam_reg=adam_reg, gamma_factor=gamma_factor,
                      epochs=epochs, batch_size=batch_size, device=device,
                      hard_threshold=hard_thresh, threshold_interval=thresh_interval,
                      eval_interval=eval_interval)
    trainer.train(trainset)


def load_data(library, data_folder, dataset, t, dt, model, end):
    x = np.load(data_folder + dataset + "/x_train" + str(end) + ".npy")
    if t is not None:
        t = np.load(data_folder + dataset + "/x_ts.npy")
    return SyntheticDataset(x=x, t=t, library=library, dataset=dataset, dt=dt, model=model)

def main():
    # Parse exp args
    args = parse_args()

    # Globals
    data_folder = "../data/"
    model = "HyperSINDy"
    dt = 0.01
    hidden_dim = 64
    stat_size = 250
    num_hidden = 5
    x_dim = 3
    adam_reg = 1e-2
    gamma_factor = 0.999
    poly_order = 3
    include_constant = True
    runs = "../runs/rossler_rmse/"
    t = None
    seed = 0
    
    # Individual experiments
    if args.s1 == 1:
        for i in range(10):
            seed = 400 + i
            set_random_seed(seed)
            run_name = "1_" + str(i)
            device = args.d1
            library = Library(n=x_dim, poly_order=poly_order, include_constant=include_constant)
            trainset = load_data(library, data_folder, "rossler_rmse/scale-1.0", t, dt, model, end=i)
            pipeline(library=library, trainset=trainset, epochs=499, lr=5e-3, batch_size=250,
                lmda_init=1e-2, lmda_max=1e-2, lmda_max_epoch=1, lmda_spike=1e-1, lmda_spike_epoch=200,
                beta_init=0.01, beta_max=10.0, beta_max_epoch=100, beta_spike=100, beta_spike_epoch=200,
                noise_dim=6, thresh_interval=100, hard_thresh=0.01, batch_norm=False, eval_interval=50,
                adam_reg=adam_reg, gamma_factor=gamma_factor, runs=runs, run_name=run_name, device=device,
                hidden_dim=hidden_dim, stat_size=stat_size, num_hidden=num_hidden)

    if args.s2 == 1:
        for i in range(10):
            seed = 500 + i
            set_random_seed(seed)
            run_name = "2_" + str(i)
            device = args.d2
            library = Library(n=x_dim, poly_order=poly_order, include_constant=include_constant)
            trainset = load_data(library, data_folder, "rossler_rmse/scale-5.0", t, dt, model, end=i)
            pipeline(library=library, trainset=trainset, epochs=600, lr=5e-3, batch_size=250,
                lmda_init=1e-2, lmda_max=1e-2, lmda_max_epoch=1, lmda_spike=1e-1, lmda_spike_epoch=300,
                beta_init=0.01, beta_max=25.0, beta_max_epoch=100, beta_spike=200, beta_spike_epoch=200,
                noise_dim=6, thresh_interval=100, hard_thresh=0.01, batch_norm=False, eval_interval=50,
                adam_reg=adam_reg, gamma_factor=gamma_factor, runs=runs, run_name=run_name, device=device,
                hidden_dim=hidden_dim, stat_size=stat_size, num_hidden=num_hidden)


    if args.s3 == 1:
        for i in range(10):
            seed = 600 + i
            set_random_seed(seed)
            run_name = "3_" + str(i)
            device = args.d3
            library = Library(n=x_dim, poly_order=poly_order, include_constant=include_constant)
            trainset = load_data(library, data_folder, "rossler_rmse/scale-10.0", t, dt, model, end=i)
            pipeline(library=library, trainset=trainset, epochs=600, lr=5e-3, batch_size=250,
                lmda_init=1e-2, lmda_max=1e-2, lmda_max_epoch=1, lmda_spike=1e0, lmda_spike_epoch=300,
                beta_init=0.01, beta_max=50.0, beta_max_epoch=100, beta_spike=300, beta_spike_epoch=200,
                noise_dim=6, thresh_interval=100, hard_thresh=0.01, batch_norm=False, eval_interval=50,
                adam_reg=adam_reg, gamma_factor=gamma_factor, runs=runs, run_name=run_name, device=device,
                hidden_dim=hidden_dim, stat_size=stat_size, num_hidden=num_hidden)
        

if __name__ == "__main__":
    main()