from __future__ import division
from __future__ import print_function

import time
import tensorflow.compat.v1 as tf
# Run TensorFlow in graph mode: the code below builds placeholders and
# executes them through tf.Session instead of running ops eagerly.
tf.compat.v1.disable_eager_execution()

from gcn.utils import *
from gcn.models import GCN, MLP

# Seed TensorFlow's random ops and NumPy's global RNG with one shared value
seed = 123
tf.set_random_seed(seed)
np.random.seed(seed)


# Command-line flags: model choice and training hyper-parameters
flags = tf.app.flags
FLAGS = flags.FLAGS

# One row per flag: (definer, name, default value, help text)
_FLAG_SPECS = (
    # dataset: 'cora', 'citeseer', 'pubmed'
    (flags.DEFINE_string, 'dataset', 'cora', 'Dataset string.'),
    # model: 'gcn', 'gcn_cheby', 'dense'
    (flags.DEFINE_string, 'model', 'gcn', 'Model string.'),
    (flags.DEFINE_float, 'learning_rate', 0.01, 'Initial learning rate.'),
    (flags.DEFINE_integer, 'epochs', 200, 'Number of epochs to train.'),
    (flags.DEFINE_integer, 'hidden1', 16, 'Number of units in hidden layer 1.'),
    (flags.DEFINE_float, 'dropout', 0.5, 'Dropout rate (1 - keep probability).'),
    (flags.DEFINE_float, 'weight_decay', 5e-4, 'Weight for L2 loss on embedding matrix.'),
    (flags.DEFINE_integer, 'early_stopping', 10, 'Tolerance for early stopping (# of epochs).'),
    (flags.DEFINE_integer, 'max_degree', 3, 'Maximum Chebyshev polynomial degree.'),
)
for _define, _name, _default, _help in _FLAG_SPECS:
    _define(_name, _default, _help)

# Experiment grid: every ratio in `ratio_l` is combined with every method
# name in `method_l`, and each combination is run for folds 1..fold_num.
# The three values are joined with the dataset name to form the key that
# is handed to load_data().
ratio_l = [0.3, 0.5, 0.7]
method_l = ['ones', 'random', 'adj', 'LP', 'sup', 'w2v']
fold_num = 10

# Per-run test accuracy and accumulated wall-clock time, indexed as
# [ratio index, method index, fold index]. The shape is derived from the
# grid above so the arrays stay in sync when the grid is edited.
_result_shape = (len(ratio_l), len(method_l), fold_num)
acc_list_1 = np.zeros(_result_shape)
time_list_1 = np.zeros(_result_shape)


dataset_name_ = 'polblogs'

# Both summary files are opened in append mode, so results from earlier
# invocations of the script are kept. `total_result` gets one line per run,
# `total_result_agg` one line per (ratio, method) pair.
total_result = open("results_total_{}.txt".format(dataset_name_), 'a')

total_result_agg = open("results_total_agg_{}.txt".format(dataset_name_), 'a')

def _run_fold(run_name, output_file):
    """Train one model on the split called ``run_name`` and test it.

    The model is built in a fresh TensorFlow graph and executed in its own
    session; both are released when the run ends. Without this, every run
    would add another model to the process-wide default graph, so the graph
    (and the set of variables touched by ``global_variables_initializer``)
    would keep growing, and sessions would never be closed.

    Training runs for at most ``FLAGS.epochs`` epochs and stops early once
    the latest validation loss exceeds the mean of the preceding
    ``FLAGS.early_stopping`` validation losses.

    Args:
        run_name: Dataset key passed to ``load_data``.
        output_file: Open, writable text file that receives the per-epoch
            log lines and the final test summary.

    Returns:
        Tuple ``(test_acc, elapsed)``: the accuracy the model reports on the
        test mask, and the summed wall-clock seconds of all training epochs
        (each including its validation pass) plus the final test evaluation.

    Raises:
        ValueError: If ``FLAGS.model`` is not 'gcn', 'gcn_cheby' or 'dense'.
    """
    # Load data
    adj, features, y_train, y_val, y_test, train_mask, val_mask, test_mask = load_data(run_name)

    # Some preprocessing
    features = preprocess_features(features)
    if FLAGS.model == 'gcn':
        support = [preprocess_adj(adj)]
        num_supports = 1
        model_func = GCN
    elif FLAGS.model == 'gcn_cheby':
        support = chebyshev_polynomials(adj, FLAGS.max_degree)
        num_supports = 1 + FLAGS.max_degree
        model_func = GCN
    elif FLAGS.model == 'dense':
        support = [preprocess_adj(adj)]  # Not used
        num_supports = 1
        model_func = MLP
    else:
        raise ValueError('Invalid argument for model: ' + str(FLAGS.model))

    with tf.Graph().as_default():
        # The graph-level seed is a property of the graph, so it has to be
        # set again on each fresh graph. NOTE: every run therefore starts
        # from the same TensorFlow seed.
        tf.set_random_seed(seed)

        # Define placeholders
        placeholders = {
            'support': [tf.sparse_placeholder(tf.float32) for _ in range(num_supports)],
            'features': tf.sparse_placeholder(tf.float32, shape=tf.constant(features[2], dtype=tf.int64)),
            'labels': tf.placeholder(tf.float32, shape=(None, y_train.shape[1])),
            'labels_mask': tf.placeholder(tf.int32),
            'dropout': tf.placeholder_with_default(0., shape=()),
            'num_features_nonzero': tf.placeholder(tf.int32)  # helper variable for sparse dropout
        }

        # Create model
        model = model_func(placeholders, input_dim=features[2][1], logging=True)

        # The context manager closes the session even if training fails.
        with tf.Session() as sess:

            # Define model evaluation function
            def evaluate(features, support, labels, mask, placeholders):
                """Return (loss, accuracy, seconds taken) for the given labels/mask."""
                t_test = time.time()
                feed_dict_val = construct_feed_dict(features, support, labels, mask, placeholders)
                outs_val = sess.run([model.loss, model.accuracy], feed_dict=feed_dict_val)
                return outs_val[0], outs_val[1], (time.time() - t_test)

            # Init variables
            sess.run(tf.global_variables_initializer())

            cost_val = []
            elapsed = 0.0

            # Train model
            for epoch in range(FLAGS.epochs):
                t = time.time()

                # Construct feed dictionary
                feed_dict = construct_feed_dict(features, support, y_train, train_mask, placeholders)
                feed_dict.update({placeholders['dropout']: FLAGS.dropout})

                # Training step
                outs = sess.run([model.opt_op, model.loss, model.accuracy], feed_dict=feed_dict)

                # Validation
                cost, acc, duration = evaluate(features, support, y_val, val_mask, placeholders)
                cost_val.append(cost)

                # Training step + validation pass count towards the run time
                elapsed += time.time() - t

                output_file.write(
                    "Epoch: {:04d} train_loss= {:.5f} train_acc= {:.5f} "
                    "val_loss= {:.5f} val_acc= {:.5f} time= {:.5f}\n".format(
                        epoch + 1, outs[1], outs[2], cost, acc, time.time() - t))

                if epoch > FLAGS.early_stopping and cost_val[-1] > np.mean(cost_val[-(FLAGS.early_stopping+1):-1]):
                    output_file.write("Early stopping...\n")
                    break

            output_file.write("Optimization Finished!\n")

            # Testing
            test_cost, test_acc, test_duration = evaluate(features, support, y_test, test_mask, placeholders)

    summary = "Test set results: cost= {:.5f} accuracy= {:.5f} time= {:.5f}".format(
        test_cost, test_acc, test_duration)
    print(summary)
    output_file.write(summary + " \n")

    return test_acc, elapsed + test_duration


# Run the whole grid: every ratio x method x fold. Each run appends its log
# to its own results file and one line to `total_result`; after all folds of
# a (ratio, method) pair, one aggregate line goes to `total_result_agg`.
try:
    for ratio_c, ratio_cnt in enumerate(ratio_l):
        for method_c, method_cnt in enumerate(method_l):
            for fold_cnt in range(1, fold_num + 1):
                run_name = '{}_{}_{}_{}'.format(dataset_name_, fold_cnt, ratio_cnt, method_cnt)

                # `with` closes the per-run log even when the run raises.
                with open("results_{}.txt".format(run_name), 'a') as output_file:
                    test_acc, elapsed = _run_fold(run_name, output_file)

                total_result.write("{}, fold_count = {}, label_rate = {}, method = {}, accuracy = {} \n".format(dataset_name_, fold_cnt, ratio_cnt, method_cnt, test_acc))

                acc_list_1[ratio_c, method_c, fold_cnt - 1] = test_acc
                time_list_1[ratio_c, method_c, fold_cnt - 1] += elapsed

            # Aggregate over the folds: error is 1 - mean accuracy.
            fold_acc = acc_list_1[ratio_c, method_c, :]
            fold_time = time_list_1[ratio_c, method_c, :]
            total_result_agg.write("{},  label_rate = {}, method = {}, error (std) = {:.3f} ({:.3f}) , time = {:.3f} ({:.3f})\n".format(dataset_name_, ratio_cnt, method_cnt, 1 - np.mean(fold_acc), np.std(fold_acc), np.mean(fold_time), np.std(fold_time)))
finally:
    # Close (and thereby flush) the summary files even if a run fails, so
    # the results written so far are not lost.
    total_result.close()
    total_result_agg.close()


