import torch
import numpy as np
import math
from torch.utils.data import Dataset, DataLoader
from torch.autograd import Variable
from sklearn.model_selection import train_test_split
import torch.nn as nn
import matplotlib.pyplot as plt
from sklearn import preprocessing
import random
import matplotlib as mpl
import os
import gc
import pandas as pd
import csv
from numpy import *
from torch.utils.tensorboard import SummaryWriter
from datetime import date
import time
import builtins
from sklearn.metrics import balanced_accuracy_score, confusion_matrix,mean_absolute_error,r2_score, mean_squared_error
from complor import dataset, complor_network

   
# which_data = input('Enter the dataset for which you want to calculate the token importance (train,valid,test):')

## Dataloader
# Number of samples per batch used by the DataLoader built in make_dataset().
batch_size = 256
class spiderdataset(Dataset):
    """In-memory dataset pairing each encoded input with its sequence length.

    Both arrays are converted to torch tensors once at construction time, so
    indexing only slices tensors that already exist.

    Args:
        ohe: numpy array of encoded inputs, indexed by sample along axis 0
            (presumably a one-hot encoding, judging by the name -- confirm
            with the caller). Stored as float32.
        seq_len: numpy array holding one length per sample. Stored as int64.
        n_samples: value reported by ``len()``; it is taken as given and not
            checked against the array sizes.
    """

    def __init__(self, ohe, seq_len, n_samples):
        # data loading
        self.ohe = torch.from_numpy(ohe.astype(np.float32))
        # Spell the dtype as np.int64: the bare name ``int64`` only resolves
        # because of the file's ``from numpy import *``.
        self.seq_len = torch.from_numpy(seq_len.astype(np.int64))
        self.n_samples = n_samples

    def __getitem__(self, index):
        """Return the ``(encoded input, sequence length)`` pair at ``index``."""
        return self.ohe[index], self.seq_len[index]

    def __len__(self):
        """Return the sample count supplied at construction."""
        return self.n_samples

def make_dataset(ohe_valid, seq_len_valid):
    """Build a fixed-order DataLoader over the given arrays.

    Args:
        ohe_valid: numpy array of encoded inputs with at least two axes.
        seq_len_valid: numpy array with one sequence length per sample.

    Returns:
        A tuple ``(loader, n_samples, width)`` where ``loader`` iterates the
        data in order (no shuffling) in batches of the module-level
        ``batch_size``, ``n_samples`` is ``ohe_valid.shape[0]`` and ``width``
        is ``ohe_valid.shape[1]``.
    """
    n_samples = ohe_valid.shape[0]
    samples = spiderdataset(ohe_valid, seq_len_valid, n_samples)
    # shuffle=False keeps batches aligned with the row order of the inputs.
    loader = DataLoader(samples, batch_size=batch_size, shuffle=False)
    return loader, n_samples, ohe_valid.shape[1]

    
def initalize(rank):
    """Rebuild the saved network, load its weights and put it in eval mode.

    The hyper-parameters are read from ``model/save_dict.npy`` and the weights
    from ``model/best.pth``, both located next to this script.

    Args:
        rank: device the model is moved to; it is also forwarded to the
            ``complor_network`` constructor.

    Returns:
        A tuple ``(model, criterion, optimizer)``: the network in eval mode on
        ``rank``, an ``nn.MSELoss`` instance, and an Adam optimizer over the
        model parameters with ``lr=0.0001``.
    """
    script_dir = os.path.dirname(os.path.abspath(__file__))
    print(torch.cuda.is_available())
    print(torch.cuda.device_count())
    # NOTE(review): allow_pickle=True unpickles arbitrary objects; only load
    # save_dict.npy from a trusted source.
    color_args = np.load(f'{script_dir}/model/save_dict.npy', allow_pickle=True).tolist()
    model = complor_network(1, color_args['q'], color_args['d'], color_args['max_m'], rank)
    # Load the checkpoint onto the CPU first so that weights saved on a GPU can
    # still be restored on a machine without that device; the model is moved
    # to ``rank`` right after.
    state_dict = torch.load(f'{script_dir}/model/best.pth', map_location='cpu')
    model.load_state_dict(state_dict)
    model.eval().to(rank)
    criterion = nn.MSELoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=0.0001)

    return model, criterion, optimizer

def contribution_score(model, criterion,optimizer,ohe, seq_len,rank):
    """Accumulate a per-position importance score for every input sample.

    For each batch the model's ``forward_motif_importance`` is run, the summed
    prediction is back-propagated, and the first element of the returned
    ``cam`` is normalised per sample by its largest absolute value. Each slice
    along the last axis of ``cam`` is then turned into position-level scores
    via ``model.calculate_motif_level`` and ``model.assigning_importance`` and
    summed into the output.

    Args:
        model: network exposing ``forward_motif_importance``,
            ``calculate_motif_level`` and ``assigning_importance``.
        criterion: unused here; kept so the signature matches ``initalize``'s
            return values.
        optimizer: only used to clear gradients before each backward pass.
        ohe: numpy array of encoded inputs (see ``make_dataset``).
        seq_len: numpy array with one sequence length per sample.
        rank: device on which the computation runs.

    Returns:
        numpy array of shape ``(ohe.shape[0], ohe.shape[1])`` with the
        accumulated importance scores.
    """
    test_loader, test_size, max_seq_len = make_dataset(ohe, seq_len)
    store_importance = torch.zeros((test_size, max_seq_len)).to(rank)
    count_test = 0
    for i_x, i_seq in test_loader:
        i_x = i_x.to(rank)
        i_seq = i_seq.to(rank).type(dtype=torch.float32)
        i_batch = i_x.size(0)
        iter_y_pred, cam, _, _ = model.forward_motif_importance(i_x, i_seq)

        # Back-propagate the summed prediction of the batch.
        base_loss = torch.sum(iter_y_pred)
        optimizer.zero_grad()
        base_loss.backward()

        cam = cam[0]

        # Scale every sample by its largest absolute entry; the tiny epsilon
        # guards against division by zero. torch.abs is used explicitly
        # because the file's ``from numpy import *`` may rebind the bare
        # name ``abs``.
        for prot in range(cam.size(0)):
            cam[prot, ...] = cam[prot, ...] / (torch.max(torch.abs(cam[prot, ...])) + 1E-18)

        # One pass per slice of the last axis; the 1-based index is what
        # calculate_motif_level receives as its second argument.
        for m_i in range(cam.size(-1)):
            mo_level_imp = model.calculate_motif_level(cam[..., m_i], m_i + 1)

            kernel_size = max_seq_len - mo_level_imp.size(-1) + 1
            store_importance[count_test:count_test + i_batch, ...] += model.assigning_importance(mo_level_imp, kernel_size, max_seq_len)

        count_test += i_batch

    # detach() so the conversion also works when the accumulated tensor has
    # become part of the autograd graph (numpy() rejects such tensors).
    return store_importance.detach().to('cpu').numpy()

