import networkx as nx
import numpy as np
from config import config_initialization
from scipy.sparse import dia_matrix, diags
from KDD_algo import compute_exact_HT_rtoB, Greedy_plusplus, Greedy_plus, Greedy_plusplus_BestofMany, compute_exact_HT_rtoB_PR
import os, time, pickle

import os, time
import sys
import math
import argparse
import itertools

from collections import defaultdict

import pickle
import multiprocessing as mp
from scipy.sparse import dia_matrix, diags

import parallel_walks
import parallel_addition
import parallel_centrality
from algo import Algorithms
from load_data import LoadData
from load_data import LoadDataRandomColors
from random_walks import chunk_random_walk
from utils import load_bubble_diameter, get_bad_and_good_nodes, get_centralities, HittingTime_sample
from matplotlib import pyplot as plt
from controversy_for_edges import compute_ROV_candidate_edge
from optimalMinimization import algoOpt, personalize_adj
import json
PATHHOME=""

class NpEncoder(json.JSONEncoder):
    def default(self, obj):
        if isinstance(obj, np.integer):
            return int(obj)
        if isinstance(obj, int64):
            return int(obj)
        if isinstance(obj, np.floating):
            return float(obj)
        if isinstance(obj, np.ndarray):
            return obj.tolist()
        return super(NpEncoder, self).default(obj)

def computePerson(G_R, R, B, person=0):
    if person==0:
        G_scc = G_R.copy()
        NN = len(G_scc.nodes)
        avec = np.ones(NN)/NN
    elif person==1: # Jump according to component size
        comps = list(nx.strongly_connected_components(G_R))
        NN = G_R.number_of_nodes()
        avec = np.zeros(NN)
        norm = sum([len(curr_comp) for curr_comp in comps]) # should be the number of nodes
        #print("n_R", G_R.number_of_nodes(), norm)
        r_degss = {r: G_R.out_degree(r) for r in G_R.nodes}

        idx =0
        R_nodes_map = {}
        for nod in list(G_R.nodes):
            R_nodes_map[nod] = idx
            idx = idx + 1

        for comp in comps:
            for element in comp:
                avec[R_nodes_map[element]] = 1./(len(comp)*len(comps))
    elif person==2: # Jump according to component size and node degree
        comps = list(nx.strongly_connected_components(G_R))
        NN = G_R.number_of_nodes()
        avec = np.zeros(NN)
        norm = sum([len(curr_comp) for curr_comp in comps]) # should be the number of nodes
        r_degss = {r: G_R.out_degree(r) for r in G_R.nodes}
        idx =0
        R_nodes_map = {}
        for nod in list(G_R.nodes):
            R_nodes_map[nod] = idx
            idx = idx + 1
        norm_degs = sum([G_R.out_degree(r)+G_R.in_degree(r) for r in G_R.nodes]) # should be twice the number of edges in G_R
        #print("2m_R", 2*G_R.number_of_edges(), norm_degs)
        for comp in comps:
            for element in comp:
                #avec[R_nodes_map[element]] = (G_R.out_degree(element)+G_R.in_degree(element))/(len(comp)*len(comps)*norm_degs)
                avec[R_nodes_map[element]] = 0.5*(G_R.out_degree(element)+G_R.in_degree(element))/(norm_degs) + 0.5*1./(len(comp)*len(comps))
    return avec

def personalize_matrix(G2, R, p_vec, damping):
    A = nx.to_numpy_array(G2)
    row_sums = A.sum(axis=1, keepdims=True)  # Compute row sums
    mat = A / row_sums  # Element-wise division
    mat[:, R] =  damping * mat[:, R] + (1-damping)*p_vec
    return mat
    

def hitting_times_exact(G, A, B):
    """
    Compute the exact hitting time vector from nodes in A to any node in B.

    Parameters:
    G : networkx.Graph
        An undirected or directed graph.
    A : set
        Set of starting nodes.
    B : set
        Set of target nodes.

    Returns:
    dict
        Dictionary of hitting times for each node in A.
    """
    nodes = list(G.nodes)
    n = len(nodes)
    
    # Node index mapping
    index_map = {node: i for i, node in enumerate(nodes)}

    # Construct transition matrix P
    P = np.zeros((n, n))
    for i, u in enumerate(nodes):
        neighbors = list(G.neighbors(u))
        if neighbors:
            P[i, [index_map[v] for v in neighbors]] = 1 / len(neighbors)
    
    # Extract submatrices
    A_indices = np.array([index_map[v] for v in A])
    B_indices = np.array([index_map[v] for v in B])
    
    P_AA = P[np.ix_(A_indices, A_indices)]
    P_AB = P[np.ix_(A_indices, B_indices)]
    
    # Identity matrix
    I_A = np.eye(len(A))
    
    # Solve (I - P_AA) h = 1
    h = np.linalg.solve(I_A - P_AA, np.ones(len(A)))
    
    # Map results to original node labels
    hitting_times = {nodes[i]: h[j] for j, i in enumerate(A_indices)}
    
    return hitting_times

def KDD_visualization_exactgreedy(A_republink, add_size, G_s, pi_R):
    '''
    get results of Kdd greedy algorithm
    :param A_republink: adjcency matrix of republink paper
    :return: hitting time array [ht after adding k1 edges, ht after adding k2 edges, ..]
    '''
    dictres = {}
    matrixA = A_republink.A
    G = nx.from_numpy_matrix(matrixA, create_using=nx.Graph())
    G_R_nodes = list(G_s.nodes)
    R = [i for i in range(numOfNode) if color_nodes[i] == 'red']
    B = [i for i in range(numOfNode) if color_nodes[i] == 'blue']

    K = add_size
    step = int(K/10)
    NumEdges = np.arange(0, K+step, step)  # x values to show in the figure
    x_axis, avgHT, maxHT, steadyHT = [], [], [], []

    st = time.time()
    G_new_list = Greedy_plus(G, R, B, NumEdges)
    en = time.time()
    rtGR = en-st


    for i, num in enumerate(NumEdges):
        G_i = G_new_list[i]
        HT = compute_exact_HT_rtoB(G_i, R, B)
        HT_R = np.array(HT)[G_R_nodes].tolist()
        stHT = sum([w*ht for (w, ht) in zip(pi_R, HT_R)])
        avght = sum(HT_R) / len(R)
        maxht = max(HT_R)
        avgHT.append(avght)
        maxHT.append(maxht)
        steadyHT.append(stHT)
        x_axis.append(num)
    dictres = {"kvect":x_axis, "averages": avgHT, "maxVec":maxHT, "steadyVec":steadyHT, "runtime": rtGR, "algo": "Greedy"}
    return dictres

def GetScoresOpt(A_republink, add_size, edgesToAdd, G_s, pi_R, PR=False, person=0, directed=False, damping=0.75):
    dictres = {}
    matrixA = A_republink.A
    if directed:
        G = nx.from_numpy_matrix(matrixA, create_using=nx.DiGraph())
    else:
        G = nx.from_numpy_matrix(matrixA, create_using=nx.Graph())
    G2 = G.copy()
    G_R_nodes = list(G_s.nodes)
    numOfNode = len(G.nodes)
    R = [i for i in range(numOfNode) if color_nodes[i] == 'red']
    B = [i for i in range(numOfNode) if color_nodes[i] == 'blue']
    print("COLORS", R, B)
    K = add_size
    step = int(K/10)

    NumEdges = np.arange(0, K+step, step)  # x values to show in the figure
    x_axis, avgHT, maxHT, steadyHT = [], [], [], []
    if PR:
        G_R = nx.induced_subgraph(G, R)
        p_vec = computePerson(G_R, R, B, person)

    prev = 0
    for i, num in enumerate(NumEdges):
        j = 0
        while prev + j < num and prev+j < len(edgesToAdd):
            G2.add_edge(edgesToAdd[prev+j][0], edgesToAdd[prev+j][1])
            j = j+1
        if PR:
            P_pr = personalize_matrix(G2, R, p_vec, damping)
            HT = compute_exact_HT_rtoB_PR(P_pr, R, B)
        else:
            HT = compute_exact_HT_rtoB(G2, R, B)
        if PR:
            HT_R = list(HT.values())
        else:
            HT_R = np.array(HT)[G_R_nodes].tolist()
        stHT = sum([w*ht for (w, ht) in zip(pi_R, HT_R)])
        avght = sum(HT_R) / len(R)
        maxht = max(HT_R)
        avgHT.append(avght)
        maxHT.append(maxht)
        steadyHT.append(stHT)
        x_axis.append(num)
    if PR:
        dictres = {"kvect":x_axis, "averages": avgHT, "maxVec":maxHT, "steadyVec":steadyHT, "algo": "OPT-PR", "pesonalization":person, "directed":directed, "damping":damping}
    else:
        dictres = {"kvect":x_axis, "averages": avgHT, "maxVec":maxHT, "steadyVec":steadyHT, "algo": "OPT"}
    return dictres
        

def calculate_raduis(mypath):

    print("Number of walks per node: ", r)


    myruntime = 0
    if not os.path.exists(PATHHOME + mypath + '/'):
        os.makedirs(PATHHOME + mypath + '/')

    # Compute bubble diameter
    st = time.time()
    result_chunks = parallel_walks.parallelization(A, labels, args.t, color_nodes, r)
    et = time.time()
    myruntime = myruntime + (et-st)
    
    with open(PATHHOME + mypath + '/bubble_diameters.pickle', 'wb') as f:
        pickle.dump(result_chunks, f)

    bubble_diameter = load_bubble_diameter(mypath, id_matrix_node, args.t)  # {5721464：5.933110367892977}
    red_bubble_diameter, blue_bubble_diameter, bad_red_vertices, bad_blue_vertices = get_bad_and_good_nodes(
        bubble_diameter, id_color, args.b, args.t)  # dictionary {5721464：5.933110367892977}


    # Compute bad nodes centralities Blue
    nodes = np.array([node_id_matrix[n] for n in bad_blue_vertices])  # 0 1 2 3 4
    print('Number blue bad nodes: ', len(nodes))
    result_chunks = parallel_centrality.parallelization(A, labels, args.t, color_nodes, r, nodes)
    with open(PATHHOME + mypath + '/' + 'blue' + '_centralities.pickle', 'wb') as f:
        pickle.dump(result_chunks, f)


    # Compute bad nodes centralities Red
    st = time.time()
    nodes = np.array([node_id_matrix[n] for n in bad_red_vertices])  # 0 1 2 3 4
    print('Number red bad nodes: ', len(nodes))
    result_chunks = parallel_centrality.parallelization(A, labels, args.t, color_nodes, r, nodes)
    et = time.time()
    myruntime = myruntime + (et-st)
    with open(PATHHOME + args.topic + '/' + 'red' + '_centralities.pickle', 'wb') as f:
        pickle.dump(result_chunks, f)

    return myruntime, red_bubble_diameter, blue_bubble_diameter, bad_red_vertices, bad_blue_vertices

def save_statisitcs():
    statisitcs = {}
    statisitcs['num of node'] = len(G.nodes)
    statisitcs['num of Red node'] = len(bad_red_vertices)  # should flip red and blue
    statisitcs['num of blue node'] = len(bad_blue_vertices)
    crossing = 0
    for i in bad_red_vertices.keys():
        for j in bad_blue_vertices.keys():
            if (i,j) in G.edges or (j,i) in G.edges():
                crossing += 1
    statisitcs['RxB'] = crossing
    statisitcs['num of all edges'] = len(G.edges)

    return statisitcs

def save_statisitcs_j():
    statisitcs = {}
    statisitcs['num of node'] = len(G.nodes)
    statisitcs['num of Red node'] = len(R)  # should flip red and blue
    statisitcs['num of blue node'] = len(B)
    crossing = 0
    for i in R:
        for j in B:
            if (id_matrix_node[i],id_matrix_node[j]) in G.edges or (id_matrix_node[j],id_matrix_node[i]) in G.edges():
                crossing += 1
    statisitcs['RxB'] = crossing
    statisitcs['num of all edges'] = len(G.edges)

    return statisitcs

def normalize_rows(matrix):
    row_sums = matrix.sum(axis=1, keepdims=True)  # Compute row sums
    return matrix / row_sums  # Element-wise division

if __name__ == '__main__':
    topics = ['guns','math_tech','tech_mil','abortion','sociology']
    maxedges = [130, 160, 20, 200, 600]  # as close to number of bad nodes as possible. In this work bad = red
    typ = 4
    isGraphDirected = False
    iterations = 1
    if typ == 0:
        topics = ['math_tech','tech_mil']
        maxedges = [130, 20]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 1:
        topics = ['abortion']
        maxedges = [1000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 2:
        topics = ['guns']
        maxedges = [130]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 3:
        #topics = ['math_ast', "polblogs", "politics"]
        #maxedges = [800, 2000, 600]  # as close to number of bad nodes as possible. In this work bad = red
        topics = ["polblogs"]
        maxedges = [2000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 4:
        topics = ['sociology']
        maxedges = [2000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 5:
        topics = ["politics"]
        maxedges = [6000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 6:
        topics = ["data/large/soc-brightkite.mtx"]
        maxedges = [40000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 7:
        topics = ["data/large/ca-dblp-2012.mtx"]
        maxedges = [30000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 8:
        topics = ["data/large/twitter_combined.txt"]
        maxedges = [1000]  # as close to number of bad nodes as possible. In this work bad = red
    elif typ == 9:
        topics = ["data/large/gplus_combined.txt"]
        maxedges = [10000]  # as close to number of bad nodes as possible. In this work bad = red
    outPath = ""
    PATHHOME = outPath
    largedata = False
    if typ > 5:
        largedata = True
    PR = False # ONLY AVAILABLE FOR SMALL DATA!
    DAMP = 0.85

    if largedata == True:
        for idx, topic in enumerate(topics):
            args = config_initialization()
            args.maxedges = maxedges[idx]
            data = LoadDataRandomColors(topic, uniform=True, directed=isGraphDirected)
            id_color = data.id_color

            #TODO: Fix the possibility to load the graph as directed
            G = data.G
            node_id_matrix = {n: i for i, n in enumerate(list(G.nodes()))}  # {5721464：0} str id - int id
            id_matrix_node = {j: i for i, j in node_id_matrix.items()}
            labels = np.array([j for i, j in sorted([(i, j) for i, j in id_matrix_node.items()], key=lambda x: x[
                0])])
            color_nodes = np.array([id_color[j] for i, j in sorted([(i, j) for i, j in id_matrix_node.items()],
                                                                   key=lambda x: x[
                                                                       0])])  # [red, blue] for int id [0 1 2 3 4 5]

            numOfNode = len(G.nodes)

            Adjacency = nx.adjacency_matrix(G)
            d = diags(1/Adjacency.sum(axis=1).A.ravel()) #Diagonal matrix [0,...1/d_i,...,0] aka D^(-1)
            A = Adjacency.T.dot(d).T


            delta = 0.05
            eps = 1
            r = int((args.t ** 2) / (eps ** 2) * np.log(1 / delta))
            ITER = 1

            R = [i for i in range(numOfNode) if color_nodes[i] == 'red']
            B = [i for i in range(numOfNode) if color_nodes[i] == 'blue']
            pi_R = []
            if not isGraphDirected:
                G_CPY = nx.from_numpy_matrix(Adjacency.A, create_using=nx.Graph())
                G_R = nx.induced_subgraph(G_CPY, R)
                largest = max(nx.connected_components(G_R), key=len)
                comp_sizes = [len(comp) for comp in nx.connected_components(G_R)]
            elif isGraphDirected:
                G_CPY = nx.from_numpy_matrix(Adjacency.A, create_using=nx.DiGraph())
                G_R = nx.induced_subgraph(G_CPY, R)
                comps = list(nx.strongly_connected_components(G_R))
                compss = sorted(comps, key=len, reverse=True)
                comp_sizes = [len(comp) for comp in comps]
                largest = max(nx.strongly_connected_components(G_R), key=len)
            
            statisitcs = save_statisitcs_j()
            fwoext, _ = os.path.splitext(topic)
            print(fwoext)
            if isGraphDirected:
                fpj = fwoext + '-statistics-dir.json'
            else:
                fpj = fwoext + '-statistics.json'
            statisitcs["comps"] = comp_sizes
            print("FWOEXT", fwoext)
            with open(fpj, 'w') as fil:
                mystats = json.dump(statisitcs, fil, cls=NpEncoder)

            
            K = maxedges[idx]
            print('number of edges to add to graph is', K)
            print('Running PARITY')
            optRes = {}
            runtimes = []
            if isGraphDirected:
                for _ in range(iterations):
                    st = time.time()
                    optAdditions, stat_pi = algoOpt(Adjacency, color_nodes, K, directed=isGraphDirected, powerMethod=True)
                    et = time.time()
                    elapsed_time = et - st
                    runtimes.append(elapsed_time)
                optRes["runtime-vec"] = runtimes
            else:
                for _ in range(iterations):
                    st = time.time()
                    optAdditions, stat_pi = algoOpt(Adjacency, color_nodes, K, directed=isGraphDirected)
                    et = time.time()
                    elapsed_time = et - st
                    runtimes.append(elapsed_time)
                optRes["runtime-vec"] = elapsed_time
            print("RT-OPT", elapsed_time)
            optRes["runtime"] = elapsed_time
            myresults = {"OPT":optRes}
            myresults["Dataset"] = topic
            fpj = fwoext + '-fullRes.json'
            if isGraphDirected:
                fpj = fwoext + '-fullResDir.json'
            with open(fpj, 'w') as fil:
                mystats = json.dump(myresults, fil, cls=NpEncoder)
            print(myresults["OPT"])
            exit(0)
        

    for idx, topic in enumerate(topics):
        args = config_initialization()
        args.topic = topic
        args.maxedges = maxedges[idx]

        retainOrig = False
        if PR:
            retainOrig = True
        print(retainOrig)
        data = LoadData(args.topic, uniform=True, directed=isGraphDirected, retainOrig=retainOrig)

        id_color = data.id_color
        G = data.G
        node_id_matrix = {n: i for i, n in enumerate(list(G.nodes()))}  # {5721464：0} str id - int id
        id_matrix_node = {j: i for i, j in node_id_matrix.items()}
        labels = np.array([j for i, j in sorted([(i, j) for i, j in id_matrix_node.items()], key=lambda x: x[
            0])])
        color_nodes = np.array([id_color[j] for i, j in sorted([(i, j) for i, j in id_matrix_node.items()],
                                                               key=lambda x: x[
                                                                   0])])  # [red, blue] for int id [0 1 2 3 4 5]
        if PR:
            K = maxedges[idx]
            fwoext, _ = os.path.splitext(topic)
            print(fwoext)
            optRes = {}
            if not isGraphDirected:
                print("Use directed PageRank!")
                exit(0)
            Adjacency = nx.adjacency_matrix(G)
            runtimes = {}
            for idx in range(3):
                st = time.time()
                optAdditionsPR, stat_PR = algoOpt(Adjacency, color_nodes, K, directed=isGraphDirected, powerMethod=True, pagerank=True, person=idx, damping=DAMP)
                et = time.time()
                elapsed_time = et - st
                runtimes[idx] = elapsed_time
                optRes2 = GetScoresOpt(Adjacency, K, optAdditionsPR, G, stat_PR, PR=True, person=idx, directed=isGraphDirected, damping=DAMP)
                optRes2["runtime"] = elapsed_time
                optRes[idx] = optRes2
            optRes["Dataset"] = topic
            topicPath = topic
            fpj =  outPath + topicPath + '/ResultsPR.json'
            print(fpj)
            with open(fpj, 'w') as fil:
                mystats = json.dump(optRes, fil, cls=NpEncoder)
            exit(0)
            

        numOfNode = len(G.nodes)

        Adjacency = nx.adjacency_matrix(G)
        d = diags(1/Adjacency.sum(axis=1).A.ravel()) #Diagonal matrix [0,...1/d_i,...,0] aka D^(-1)
        A = Adjacency.T.dot(d).T


        delta = 0.05
        eps = 1
        r = int((args.t ** 2) / (eps ** 2) * np.log(1 / delta))
        ITER = 1

        R = [i for i in range(numOfNode) if color_nodes[i] == 'red']
        B = [i for i in range(numOfNode) if color_nodes[i] == 'blue']
        pi_R = []
        if not isGraphDirected:
            G_CPY = nx.from_numpy_matrix(Adjacency.A, create_using=nx.Graph())
            print(R)
            G_R = nx.induced_subgraph(G_CPY, R)
            largest = max(nx.connected_components(G_R), key=len)
            comp_sizes = [len(comp) for comp in nx.connected_components(G_R)]
            G_scc = G_R.subgraph(largest).copy()
            deg_vec = [v[1] for v in list(G_scc.degree())]
            #print("deg", deg_vec)
            two_m_G_R = sum(deg_vec)
            pi_R = [deg/(1.*two_m_G_R) for deg in deg_vec]
        elif isGraphDirected:
            G_CPY = nx.from_numpy_matrix(Adjacency.A, create_using=nx.DiGraph())
            G_R = nx.induced_subgraph(G_CPY, R)
            comps = list(nx.strongly_connected_components(G_R))
            compss = sorted(comps, key=len, reverse=True)
            comp_sizes = [len(comp) for comp in comps]
            largest = max(nx.strongly_connected_components(G_R), key=len)
            
            # Create the induced subgraph
            G_scc = G_R.subgraph(compss[0]).copy()
            A_R = nx.adjacency_matrix(G_scc).A
            normalizedA = normalize_rows(A_R)
            #We have to transpose so that Markov transitions correspond to right multiplying by a column vector.  np.linalg.eig finds right eigenvectors.
            evals, evecs = np.linalg.eig(normalizedA.T)
            evec1 = evecs[:,np.isclose(evals, 1)]

            #Since np.isclose will return an array, we've indexed with an array
            #so we still have our 2nd axis.  Get rid of it, since it's only size 1.
            evec1 = evec1[:,0]

            stationary = evec1 / evec1.sum()

            #eigs finds complex eigenvalues and eigenvectors, so you'll want the real part.
            pi_R = stationary.real

        # calculate bubble radius for all nodes, red nodes and blue nodes, save separately.
        topicPath = topic
        if isGraphDirected:
            topicPath = topic
        
        if not (typ==5) and not (typ==4) and not isGraphDirected:
            runtimeCentr, red_bubble_diameter, blue_bubble_diameter, bad_red_vertices, bad_blue_vertices = calculate_raduis(topicPath)  # comment if already computed
            bubble_diameter = load_bubble_diameter(topicPath, id_matrix_node, args.t)  # {5721464：5.933110367892977}
            red_bubble_diameter, blue_bubble_diameter, bad_red_vertices, bad_blue_vertices = get_bad_and_good_nodes(
                bubble_diameter, id_color, args.b, args.t)
            et = time.time()

            statisitcs = save_statisitcs()
            statisitcs["comps"] = comp_sizes
            fp = outPath + topicPath + '/statistics.pickle'
            with open(fp, 'wb') as f:
                pickle.dump(statisitcs, f)

            print ('------------------------')
            print (statisitcs)
            print('-------------------------')
        else:
            statisitcs = save_statisitcs_j()
            fpj = outPath + topicPath + '/statistics-dir.json'
            statisitcs["comps"] = comp_sizes
            with open(fpj, 'w') as fil:
                mystats = json.dump(statisitcs, fil, cls=NpEncoder)

        
        K = maxedges[idx]
        print('number of edges to add to graph is', K)
        print('Running PARITY')
        st = time.time()
        optAdditions, stat_pi = algoOpt(Adjacency, color_nodes, K, directed=isGraphDirected)
        et = time.time()
        set_R = set(R)
        set_B = set(B)
        for el in optAdditions:
            if el[0] not in set_R:
                print("ADDITION IS FROM BLUE)")
            if el[1] not in set_B:
                print("ADDITION IS TO R")
        elapsed_time = et - st
        print("RT-OPT", elapsed_time)
        optRes = GetScoresOpt(Adjacency, K, optAdditions, G_scc, pi_R)
        optRes["runtime"] = elapsed_time
        myresults = {"OPT":optRes}
        print(optRes["maxVec"])
        runtimes = []
        runtimesPR = []
        if isGraphDirected:
            for _ in range(iterations):
                st = time.time()
                optAdditions, stat_pi = algoOpt(Adjacency, color_nodes, K, directed=isGraphDirected, powerMethod=True)
                print("Statdistri", stat_pi[:20])
                et = time.time()
                st2 = time.time()
                optAdditionsPR, stat_PR = algoOpt(Adjacency, color_nodes, K, directed=isGraphDirected, powerMethod=True, pagerank=True)
                print("PRdistri", stat_PR[:20])
                et2 = time.time()
                elapsed_time = et - st
                elapsed_time2 = et2 - st2
                runtimes.append(elapsed_time)
                runtimesPR.append(elapsed_time2)
                print("RT-OPT-PM", elapsed_time)
            optRes1 = GetScoresOpt(Adjacency, K, optAdditions, G_scc, pi_R)
            optRes2 = GetScoresOpt(Adjacency, K, optAdditions, G_scc, stat_PR)
            optRes1["runtime-vec"] = runtimes
            optRes1["runtime-vec-PR"] = runtimesPR
            optRes1["runtime-PM"] = elapsed_time
            myresults["OPT-PM"]= optRes1
            myresults["OPT-PM-PR"]= optRes2
    
        if typ == 5 or typ == 4 or isGraphDirected:
            statisitcs = save_statisitcs_j()
            if typ ==5 or typ ==4:
                fpjj = outPath + topicPath + '/fullResBig.json'
            if isGraphDirected:
                fpjj = outPath + topicPath + '/fullResBig-dir.json'
            with open(fpjj, 'w') as fil:
                mystats = json.dump(myresults, fil, cls=NpEncoder)
            continue 

        # calculate candidate edges for ROV algorithm, save to pickle

        st = time.time()
        ROV_edges = compute_ROV_candidate_edge(data, G, A, node_id_matrix, id_matrix_node, args)
        et = time.time()
        rtROV = et - st
        with open(outPath + topicPath + '/rov_candidate_edges.pickle', 'wb') as f:
            pickle.dump(ROV_edges, f)
        #
        with open(outPath + topicPath + '/rov_candidate_edges.pickle', 'rb') as f:
            ROV_edges = pickle.load( f)

        #K = len(ROV_edges)
        
        nodes = np.array([node_id_matrix[n] for n in bad_red_vertices])
        alg = Algorithms(bad_red_vertices, blue_bubble_diameter, labels, args.t, color_nodes, r, nodes, node_id_matrix, list(G.edges()), ITER)

        st = time.time()
        baseline_edge = alg._compute_candidate_edge(algorithm='baseline',top_k=100,centrality=[])
        et = time.time()
        rtBL = et - st


        centrality = get_centralities(id_matrix_node, topicPath, 'red', args.t, old=False)  # {str id, centrality}
        st = time.time()
        top_k = int(len(centrality) / 100 * args.topk)
        RC_candidate_edges = alg._compute_candidate_edge('rand_central', top_k, centrality)
        et = time.time()
        rtRC = runtimeCentr+ (et - st)

        fpj = outPath + topicPath + '/statistics.json'
        statisitcs["Steady-dist-nodes"] = list(G_scc.nodes)
        statisitcs["Steady-dist-vec"] = pi_R
        if isGraphDirected:
            fpj = outPath + topicPath + '/statistics-dir.json'
        with open(fpj, 'w') as fil:
            mystats = json.dump(statisitcs, fil, cls=NpEncoder)

        st = time.time()
        WRC_candidate_edges = alg._compute_candidate_edge('w_rand_central', top_k, centrality, G)
        et = time.time()
        rtWRC = runtimeCentr + (et - st)


        st = time.time()
        REpublik_candidate_edges = alg._compute_candidate_edge('w_pen_central', top_k, centrality, G)
        REpublik_candidate_edges = REpublik_candidate_edges[:K]
        et = time.time()
        rtREP = runtimeCentr + (et - st)

        alg_edges = [baseline_edge, ROV_edges, RC_candidate_edges, WRC_candidate_edges, REpublik_candidate_edges]
        algorithms = ['baseline','ROV','RC','WRC','Reppublik','KDD']
        runtimes = [rtBL, rtROV, rtRC, rtWRC, rtREP]
        FULL_ALGS = ['baseline','ROV','RC','WRC','Reppublik','Greedy', 'OPT']
        if isGraphDirected:
            FULL_ALGS = ['baseline','ROV','RC','WRC','Reppublik', 'OPT']



        # visualization
        AVG = []
        MAX = []
        STEADY = []
        n = len(color_nodes)
        Red_int = [i for i in range(n) if color_nodes[i] == 'red']
        Blue_int = [i for i in range(n) if color_nodes[i] == 'blue']

        for i, algorithm in enumerate(algorithms[:-1]):
            edges = alg_edges[i]
            print (algorithm, 'len(edges)',len(edges))
            x_axis, avgHT, maxHT, steadyht = HittingTime_sample(Adjacency, edges, Red_int, Blue_int, color_nodes, algorithm, K, G_scc, pi_R)
            AVG.append(avgHT)
            MAX.append(maxHT)
            STEADY.append(steadyht)
            dictres = {"kvect":x_axis, "averages": avgHT, "maxVec":maxHT,"steadyVec":steadyht, "algo": algorithm, "runtime":runtimes[i]}
            myresults[algorithm] = dictres

        if not isGraphDirected:
            greedyres = KDD_visualization_exactgreedy(Adjacency, K, G_scc, pi_R)
            myresults["Greedy"] = greedyres
        myresults["All-Algos"] = FULL_ALGS
        myresults["Dataset"] = topic
        fpj = outPath + topicPath + '/fullRes.json'
        '''
        if isGraphDirected:
            fpj = outPath + topicPath + '/fullRes-dir.json'
        '''
        with open(fpj, 'w') as fil:
            mystats = json.dump(myresults, fil, cls=NpEncoder)
        print(myresults["OPT"])
        
        continue

        AVG.append(avgHT)
        MAX.append(maxHT)

        fp = outPath + topic + '/' + str(time.localtime().tm_hour) + '-' + str(time.localtime().tm_min) + '-AVG.pickle'
        with open(fp, 'wb') as f:
            pickle.dump(AVG,f)

        fp = outPath + topic + '/' + str(time.localtime().tm_hour) + '-' + str(time.localtime().tm_min) + '-MAX.pickle'
        with open(fp, 'wb') as f:
            pickle.dump(MAX,f)


        colormap = ['g', 'b', 'r', 'y', 'm', 'c']
        markermap = ['o', 'v', '^', '<', '>', 'x']

        # visualize average hitting time
        fig, ax = plt.subplots()

        for i in range(len(algorithms)):
            ax.plot(x_axis, AVG[i], color=colormap[i], marker=markermap[i], label=algorithms[i])

        plt.xlabel("k")
        plt.ylabel("objective value")
        legend = ax.legend(loc='upper center', shadow=False)

        plt.title(args.topic + ' avg hitting time')

        fig1 = plt.gcf()
        #plt.show()
        plt.draw()
        fig1.savefig(outPath + args.topic + ' avg hitting time')


        # visualize max hitting time
        fig, ax = plt.subplots()
        for i in range(len(algorithms)):
            ax.plot(x_axis, MAX[i], color=colormap[i], marker=markermap[i], label=algorithms[i])

        plt.xlabel("k")
        plt.ylabel("objective value")
        legend = ax.legend(loc='upper center', shadow=False)
        plt.title(args.topic + ' max hitting time')

        fig1 = plt.gcf()
        #plt.show()
        plt.draw()
        fig1.savefig(outPath + args.topic + ' max hitting time')
