#Video_classification

import math
import numpy as np
import h5py
import pandas as pd
from numpy import genfromtxt
import matplotlib.pyplot as plt
import tensorflow.compat.v1 as tf
from tensorflow.python.framework import ops
from tf_utils import  random_mini_batches, convert_to_one_hot, predict, loading_train_test, loading_source_new, loading_target1, loading_target2, loading_target3, loading_sketch, loading_clipart 
from sklearn.covariance import EmpiricalCovariance


X_source, Y_source, X_test_source1, Y_test_source1= loading_clipart()
X_target1, Y_target1, X_test_target1, Y_test_target1  = loading_sketch()



X_source=X_source.to_numpy()
Y_source=Y_source.to_numpy()
X_test_source1=X_test_source1.to_numpy()
Y_test_source1=Y_test_source1.to_numpy()

X_target1=X_target1.to_numpy()
Y_target1=Y_target1.to_numpy()
X_test_target1=X_test_target1.to_numpy()
Y_test_target1=Y_test_target1.to_numpy()



###num1_S=3, num2_S=4 corresponds to Clock and Ambulance; um1_S=3, num2_S=6 corresponds to clock and crow; um1_S=6, num2_S=16 corresponds to Crow and basket  


num1_S=3
num2_S=6
x1 = np.where(Y_source == num1_S)
x2 = np.where(Y_source == num2_S)

x1=np.asarray(x1)
x1=x1[0]

x2=np.asarray(x2)
x2=x2[0]

print(type(x1))
#x1=x1.tolist()
#print(x1)
#print(X_source[x1,:].shape)

#x1=Y_source.index(num1)
#x2=Y_source.index(num2)


a1 = np.where(Y_test_source1 == num1_S)
a2 = np.where(Y_test_source1 == num2_S)

a1=np.asarray(a1)
a1=a1[0]

a2=np.asarray(a2)
a2=a2[0]

#print(x1.shape)


Y_source_binary=Y_source[x1]
Y_source_binary=np.append(Y_source_binary,Y_source[x2])

Y_source_test_binary=Y_test_source1[a1]
Y_source_test_binary=np.append(Y_source_test_binary,Y_test_source1[a2])

X_source_binary=X_source[x1,:]
X_source_binary=np.append(X_source_binary,X_source[x2,:],axis=0)

X_source_test_binary=X_test_source1[a1,:]
X_source_test_binary=np.append(X_source_test_binary,X_test_source1[a2,:],axis=0)

Y_source_binary=np.asarray(Y_source_binary)
Y_source_test_binary=np.asarray(Y_source_test_binary)




num1_T=3
num2_T=4
x1 = np.where(Y_target1 == num1_T)
x2 = np.where(Y_target1 == num2_T)

x1=np.asarray(x1)
x1=x1[0]

x2=np.asarray(x2)
x2=x2[0]
#print(type(x1))
#x1=x1.tolist()
#print(x1)
#print(X_source[x1,:].shape)

#x1=Y_source.index(num1)
#x2=Y_source.index(num2)


a1 = np.where(Y_test_target1 == num1_T)
a2 = np.where(Y_test_target1 == num2_T)

a1=np.asarray(a1)
a1=a1[0]

a2=np.asarray(a2)
a2=a2[0]

print(x1.shape)

Y_target_binary=Y_target1[x1]
Y_target_binary=np.append(Y_target_binary,Y_target1[x2])

Y_target_test_binary=Y_test_target1[a1]
Y_target_test_binary=np.append(Y_target_test_binary,Y_test_target1[a2])

X_target_binary=X_target1[x1,:]
X_target_binary=np.append(X_target_binary,X_target1[x2,:],axis=0)

X_target_test_binary=X_test_target1[a1,:]
X_target_test_binary=np.append(X_target_test_binary,X_test_target1[a2,:],axis=0)

Y_target_binary=np.asarray(Y_target_binary)
Y_target_test_binary=np.asarray(Y_target_test_binary)








for i in range(len(Y_source_binary)):
    #print(num1)
    if Y_source_binary[i]==num1_S:
        Y_source_binary[i]=0
    if Y_source_binary[i]==num2_S:
        Y_source_binary[i]=1

for i in range(len(Y_source_test_binary)):
    if Y_source_test_binary[i]==num1_S:
        Y_source_test_binary[i]=0
    if Y_source_test_binary[i]==num2_S:
        Y_source_test_binary[i]=1        

        
for i in range(len(Y_target_test_binary)):
    if Y_target_test_binary[i]==num1_T:
        Y_target_test_binary[i]=0
    if Y_target_test_binary[i]==num2_T:
        Y_target_test_binary[i]=1
        
for i in range(len(Y_target_binary)):
    if Y_target_binary[i]==num1_T:
        Y_target_binary[i]=0
    if Y_target_binary[i]==num2_T:
        Y_target_binary[i]=1




Y_source_binary=Y_source_binary.T
Y_source_test_binary=Y_source_test_binary.T
Y_target_binary=Y_target_binary.T
Y_target_test_binary=Y_target_test_binary.T



X_source_binary=X_source_binary.T
X_source_test_binary=X_source_test_binary.T
X_target_binary=X_target_binary.T
X_target_test_binary=X_target_test_binary.T



Y_S=np.zeros((1, len(Y_source_binary)))
Y_S_test=np.zeros((1, len(Y_source_test_binary)))
Y_T=np.zeros((1, len(Y_target_binary)))
Y_T_test=np.zeros((1, len(Y_target_test_binary)))


for i in range(len(Y_source_binary)):
    Y_S[0,i]=Y_source_binary[i]
for i in range(len(Y_source_test_binary)):
    Y_S_test[0,i]=Y_source_test_binary[i]
for i in range(len(Y_target_binary)):
    Y_T[0,i]=Y_target_binary[i]
for i in range(len(Y_target_test_binary)):
    Y_T_test[0,i]=Y_target_test_binary[i]




from random import shuffle
N=Y_S.shape[1]
ind_list = list(range(N))
shuffle(ind_list)
Y_S=Y_S[:,ind_list]
X_source_binary=X_source_binary[:,ind_list]

N=Y_S_test.shape[1]
ind_list = list(range(N))
shuffle(ind_list)
Y_S_test=Y_S_test[:,ind_list]
X_source_test_binary=X_source_test_binary[:,ind_list]

N=Y_T.shape[1]
ind_list = list(range(N))
shuffle(ind_list)
Y_T=Y_T[:,ind_list]
X_target_binary=X_target_binary[:,ind_list]


N=Y_T_test.shape[1]
ind_list = list(range(N))
shuffle(ind_list)
Y_T_test=Y_T_test[:,ind_list]
X_target_test_binary=X_target_test_binary[:,ind_list]


def create_placeholders(n_x, n_y):
    
    
    X = tf.placeholder(tf.float32, shape=[n_x, None])
    Y = tf.placeholder(tf.float32, shape=[n_y, None])
    
    
    return X, Y


def initialize_parameters_source_classification():
    
    
    tf.set_random_seed(1)                   
        
    
    W1 = tf.get_variable("W1", [15,2048], initializer = tf.glorot_uniform_initializer(seed = 1))
    b1 = tf.get_variable("b1", [15,1], initializer = tf.zeros_initializer())
    
    W2 = tf.get_variable("W2", [1,15], initializer = tf.glorot_uniform_initializer(seed = 1))
    b2 = tf.get_variable("b2", [1,1], initializer = tf.zeros_initializer())
    
    ### END CODE HERE ###

    parameters = {"W1": W1,
                  "b1": b1,
                  "W2": W2,
                  "b2": b2,
                  }
    
    return parameters


def initialize_parameters_target_classification():
    
    
    tf.set_random_seed(1)                   
        
    
    W1 = tf.get_variable("W1", [15,2048], initializer = tf.glorot_uniform_initializer(seed = 1))
    b1 = tf.get_variable("b1", [15,1], initializer = tf.zeros_initializer())
    
    W2 = tf.get_variable("W2", [1,15], initializer = tf.glorot_uniform_initializer(seed = 1))
    b2 = tf.get_variable("b2", [1,1], initializer = tf.zeros_initializer())
    
    ### END CODE HERE ###

    parameters = {"W1": W1,
                  "b1": b1,
                  "W2": W2,
                  "b2": b2,
                  }
    
    return parameters


def forward_propagation_classification(X, parameters):
    
    W1 = parameters['W1']
    b1 = parameters['b1']
    
    W2 = parameters['W2']
    b2 = parameters['b2']
    
   
    
                  
    Z1 = tf.add(tf.matmul(W1,X),b1)                                             
    
    A1= tf.nn.relu(Z1)
    
    Z2 =tf.add(tf.matmul(W2,A1),b2)    
                                                                                            
    
    
    return Z2

def compute_cost_classification(Z2, Y):
    
    
    logits = tf.transpose(Z2)
    labels = tf.transpose(Y)
    cost = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(logits=logits, labels=labels))
    
    
    return cost



def model(X_train, Y_train,X_test, Y_test, learning_rate = 0.0001,
          num_epochs = 80, minibatch_size =1 , print_cost = True, source=True, target=False):
    
    
   
    
    ops.reset_default_graph()                         # to be able to rerun the model without overwriting tf variables                            # to keep consistent results
    seed = 3                                          # to keep consistent results
    (n_x, m) = X_train.shape                          # (n_x: input size, m : number of examples in the train set)
    n_y = Y_train.shape[0]                            # n_y : output size
    costs = []                                        # To keep track of the cost
    
    # Create Placeholders of shape (n_x, n_y)
    
    X, Y = create_placeholders(n_x, n_y)
    
    if source==True and target==False:  
        #parameters = initialize_parameters_source()
        parameters=initialize_parameters_source_classification()
        print("source")
    if source==False and target==True:
        #parameters = initialize_parameters_target()
        parameters=initialize_parameters_target_classification()
        print("target")
   

    
    
   
    Z2 = forward_propagation_classification(X, parameters)
    
    
    cost=compute_cost_classification(Z2, Y)
    
    optimizer = tf.train.AdamOptimizer(learning_rate = learning_rate).minimize(cost)
    
    
    # Initialize all the variables
    init = tf.global_variables_initializer()

    # Start the session to compute the tensorflow graph
    with tf.Session() as sess:
        
        # Run the initialization
        sess.run(init)
        
        # Do the training loop
        for epoch in range(num_epochs):

            epoch_cost = 0.                       # Defines a cost related to an epoch
            num_minibatches = int(m / minibatch_size) # number of minibatches of size minibatch_size in the train set
            seed = seed + 1
            minibatches = random_mini_batches(X_train, Y_train, minibatch_size, seed)

            for minibatch in minibatches:

                # Select a minibatch
                (minibatch_X, minibatch_Y) = minibatch
                
                
                _ , minibatch_cost = sess.run([optimizer, cost], feed_dict={X: minibatch_X, Y: minibatch_Y})
                
                
                epoch_cost += minibatch_cost / minibatch_size

            
            if print_cost == True and epoch % 10 == 0:
                print ("Cost after epoch %i: %f" % (epoch, epoch_cost))
            if print_cost == True and epoch % 5 == 0:
                costs.append(epoch_cost)
                
        

        
        parameters = sess.run(parameters)
        print ("Parameters have been trained!")
       
            
        

        
        return parameters

def model_weighted(X_train_source, Y_train_source,X_train_target,Y_train_target,X_test_target, Y_test_target,lam=.2, learning_rate = 0.0001,
    
    
    ops.reset_default_graph()                         # to be able to rerun the model without overwriting tf variables                            # to keep consistent results
    seed = 3                                          # to keep consistent results
    (n_x_source, m_source) = X_train_source.shape
    (n_x_target, m_target) = X_train_target.shape                          # (n_x: input size, m : number of examples in the train set)
    n_y_source = Y_train_source.shape[0] 
    n_y_target = Y_train_target.shape[0]                            # n_y : output size
    costs = []                                        # To keep track of the cost
    
    # Create Placeholders of shape (n_x, n_y)
    
    X_source, Y_source = create_placeholders(n_x_source, n_y_source)
    X_target, Y_target = create_placeholders(n_x_target, n_y_target)
    parameters=initialize_parameters_target_classification()
    
   

   
    Z2_source = forward_propagation_classification(X_source, parameters)
    Z2_target = forward_propagation_classification(X_target, parameters)
    
    
    # Cost function: Add cost function to tensorflow graph
    
    cost = compute_cost_weighted(Z2_source, Y_source,Z2_target,Y_target,lam)
    #cost1 = compute_cost1(Z2_target, Y_target)
    
    
    # Backpropagation: Define the tensorflow optimizer.
    
    optimizer = tf.train.AdamOptimizer(learning_rate = learning_rate).minimize(cost)
    
    
    # Initialize all the variables
    init = tf.global_variables_initializer()

    # Start the session to compute the tensorflow graph
    with tf.Session() as sess:
        
        # Run the initialization
        sess.run(init)
        
        # Do the training loop
        for epoch in range(num_epochs):

            epoch_cost = 0.                       # Defines a cost related to an epoch
            #num_minibatches = int(m / minibatch_size) # number of minibatches of size minibatch_size in the train set
            seed = seed + 1
            #minibatches = random_mini_batches(X_train, Y_train, minibatch_size, seed)

            #for minibatch in minibatches:

                # Select a minibatch
             #   (minibatch_X, minibatch_Y) = minibatch
                
                # IMPORTANT: The line that runs the graph on a minibatch.
                # Run the session to execute the "optimizer" and the "cost", the feedict should contain a minibatch for (X,Y).
                ### START CODE HERE ### (1 line)
            _ , minibatch_cost = sess.run([optimizer, cost], feed_dict={X_source: X_train_source, Y_source: Y_train_source, X_target: X_train_target, Y_target: Y_train_target})
                ### END CODE HERE ###
                
            epoch_cost += minibatch_cost 
            
            
        parameters = sess.run(parameters)
        
        
        return parameters

parameters = model(X_source_binary, Y_S, X_source_test_binary, Y_S_test ,source=True, target=False)


def sigmoid(X):
   return 1/(1+np.exp(-X))

def relu(x):
    return np.maximum(0, x)

#EVALUATION OF SOURCE ON TARGET

test_acc=0
N1=Y_T_test.shape[1]*1.0
for i in range(Y_T_test.shape[1]):
    a=np.dot(parameters['W1'],X_target_test_binary[:,i])
    mid_size=parameters['W1'].shape[0]
    a=a.reshape((mid_size, 1))
    a=a+parameters['b1']
    #print(a.shape)
    a=relu(a)
    a=np.dot(parameters['W2'],a)+parameters['b2']
    a=sigmoid(a)
    if a>.5 and Y_T_test[:,i]==1:
        test_acc=test_acc+1
    if a<.5 and Y_T_test[:,i]==0:
        test_acc=test_acc+1
test_acc=test_acc/N1
print(test_acc)

