{"cells":[{"cell_type":"code","execution_count":88,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":16406,"status":"ok","timestamp":1706618427794,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"vAmwpTNBOQAb","outputId":"a4b6a2ea-3a0e-4f64-b2ec-dadbcf37424b"},"outputs":[],"source":["#!pip install torch\n","#!pip install torch_geometric"]},{"cell_type":"code","execution_count":89,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":3488,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"9rWT6zzqOTUl","outputId":"e292796c-b0b7-432b-a75b-b5825ef8e87f"},"outputs":[],"source":["#from google.colab import drive\n","#drive.mount('/content/drive')"]},{"cell_type":"code","execution_count":90,"metadata":{"executionInfo":{"elapsed":10,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"dYVsmcYxOKae"},"outputs":[],"source":["r_global = 0.05\n","k_global = 0\n","dataset_global = \"Pubmed\"\n","\n","not_visited_set = [[100.0,0.001,1.0,0.001,0.01]]\n","\n","save_csv_files = 0\n","exp_iter = 10\n","detailed = 0"]},{"cell_type":"code","execution_count":91,"metadata":{"executionInfo":{"elapsed":9,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"wOwlhrzfOKap"},"outputs":[],"source":["from IPython.display import clear_output\n","from networkx.algorithms import community\n","from networkx.generators.community import random_partition_graph\n","from networkx.generators.community import stochastic_block_model\n","from networkx.generators.random_graphs import barabasi_albert_graph\n","from networkx.generators.random_graphs import erdos_renyi_graph\n","from networkx.generators.random_graphs import watts_strogatz_graph\n","from random import sample\n","from scipy.sparse import csgraph\n","from scipy.sparse import csr_matrix\n","from scipy.sparse import random\n","from scipy.sparse import random\n","from scipy.sparse.linalg import inv\n","from scipy.sparse.linalg import norm\n","from scipy.stats import rv_continuous\n","from sklearn.decomposition import FactorAnalysis\n","from torch import Tensor\n","from torch_geometric.datasets import Planetoid\n","from torch_geometric.datasets import DBLP\n","from torch_geometric.datasets import Coauthor\n","from torch_geometric.datasets import CitationFull\n","from torch_geometric.datasets import WebKB\n","from torch_geometric.nn import GCNConv\n","from torch_geometric.nn import GATConv\n","from torch_geometric.utils import dense_to_sparse,homophily\n","from torch_geometric.utils import to_dense_adj\n","from torch_geometric.utils import to_networkx\n","from tqdm import tqdm\n","import collections\n","import math\n","import matplotlib.pyplot as plt\n","import networkx as nx\n","import numpy as np\n","import os\n","os.environ['CUDA_VISIBLE_DEVICES'] = '-1'\n","import pandas as pd\n","#from pyswarm import pso\n","import scipy.sparse as sp\n","import seaborn as sns\n","import torch.nn.functional as F\n","import torch_geometric\n","import torch\n","import time\n","device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n","\n","\n","import gc"]},{"cell_type":"code","execution_count":92,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":9,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"WIlJvMpSOKas","outputId":"dd826512-c98a-45ba-c25c-23518a502142"},"outputs":[{"name":"stdout","output_type":"stream","text":["readings_path c:\\Users\\archi\\Desktop\\Research-Papers\\Archit's Code\\Visualization Chart/Pubmed/0.05\n","csv_path c:\\Users\\archi\\Desktop\\Research-Papers\\Archit's Code\\Visualization Chart/Pubmed/\n","Dataframe is being made.\n","Done\n"]}],"source":["#path = '/content/drive/My Drive/TEST TRAIN FGC with DELTA and APPNP/TEST TRAIN CS'\n","path = os.getcwd()\n","readings_path = path+\"/\"+dataset_global+\"/\"+str(r_global)\n","csv_path =  path+\"/\"+dataset_global+\"/\"\n","#check if dataframe exists\n","print(\"readings_path\",readings_path)\n","print(\"csv_path\",csv_path)\n","\n","try:\n","    df = pd.read_csv(readings_path+\"/parameter_readings_with_delta.csv\")\n","except:\n","    print(\"Dataframe is being made.\")\n","    df = pd.DataFrame(columns=['alpha_param','beta_param','gamma_param','lambda_param','delta_param','r','k','acc'])\n","    df.to_csv(readings_path+\"/parameter_readings_with_delta.csv\",index=False)\n","    print(\"Done\")\n","\n","def save_readings(alpha_param,beta_param,gamma_param,lambda_param,delta_param,r,k,acc):\n","    df = pd.read_csv(readings_path+'/'+'parameter_readings_with_delta.csv')\n","    df = df[df['acc']>=0]\n","    df = df.sort_values(by=['acc'])\n","    df.loc[len(df)] = [alpha_param,beta_param,gamma_param,lambda_param,delta_param,r,k,acc]\n","    df.to_csv(readings_path+'/'+'parameter_readings_with_delta.csv', index=False)\n","\n"]},{"cell_type":"code","execution_count":93,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":8,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"pNgX-krhOKav","outputId":"89347225-ac28-469a-d175-efeaa28e8f0a"},"outputs":[{"name":"stdout","output_type":"stream","text":["c:/Pubmed\n"]}],"source":["\n","device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n","data_dir = \"./data\"\n","os.makedirs(data_dir, exist_ok=True)\n","\n","\n","# In[26]:\n","\n","\n","os.getcwd()\n","dataset = os.path.join(os.getcwd(),'/'+dataset_global)\n","print(dataset)\n","\n","\n","# In[27]:\n","\n","if dataset_global in ['CS','Physics']:\n","    dataset = Coauthor(root='data/Coauthor',name=dataset_global)\n","elif dataset_global in ['Cora','Citeseer','Pubmed']:\n","    dataset = Planetoid(root='data/Planetoid',name=dataset_global)\n","elif dataset_global in ['DBLP']:\n","    dataset = CitationFull(root='data/DBLP',name='DBLP')\n","else:\n","    print(\"No Dataset Provided. Going with DBLP\")\n","    dataset = CitationFull(root='data/DBLP',name='DBLP')\n","#\n","    \n","#dataset = Planetoid(root='data/Planetoid',name=dataset_global)\n","\n","edge_list = dataset[0].edge_index\n","NO_OF_EDGES = edge_list.shape[1]\n","labels = dataset[0].y\n","\n","# print(\"Homophilic ratio : \" + str(homophily(edge_list,labels,method='edge')))\n","\n","\n","adj = to_dense_adj(dataset[0].edge_index)\n","adj = adj[0]\n","\n","labels = labels.numpy()\n","\n","X = dataset[0].x\n","X = X.to_dense()\n","N = X.shape[0]\n","NO_OF_CLASSES = len(set(labels))\n","\n","sparsity_original = 2*NO_OF_EDGES/(N*(N-1))\n","# print(\"Sparsity of original graph : \" + str(sparsity_original))\n","\n","nn = int(1*N)\n","X = X[:nn,:]\n","adj = adj[:nn,:nn]\n","labels = labels[:nn]\n","# print(X.shape,adj.shape)\n","\n","\n","\n","def get_laplacian(adj):\n","    b=torch.ones(adj.shape[0])\n","    return torch.diag(adj@b)-adj\n","\n","theta = get_laplacian(adj)\n","# print(theta.shape)\n","\n","\n","features = X.numpy()\n","NO_OF_NODES = X.shape[0]\n","\n","total_indices1 = torch.arange(NO_OF_NODES)\n","shuffled_indices1 = torch.randperm(total_indices1.numel())\n","train_mask = int(0.1 * total_indices1.numel())\n","#print(\"Train Mask\", train_mask)\n","\n","\n","def convertScipyToTensor(coo):\n","    try:\n","        coo = coo.tocoo()\n","    except:\n","        coo = coo\n","    values = coo.data\n","    indices = np.vstack((coo.row, coo.col))\n","\n","    i = torch.LongTensor(indices)\n","    v = torch.FloatTensor(values)\n","    shape = coo.shape\n","\n","    return torch.sparse.FloatTensor(i, v, torch.Size(shape))\n","\n","\n","from scipy.sparse import csr_matrix\n","from scipy.sparse import random\n","from scipy.sparse.linalg import norm\n","from scipy.stats import rv_continuous\n","\n","p = X.shape[0]\n","k = int(p*r_global)\n","k_global = int(p*r_global)\n","n = X.shape[1]\n","lambda_param = 100\n","beta_param = 50\n","alpha_param = 100\n","gamma_param = 100\n","lr = 1e-5\n","thresh = 1e-10\n","\n","\n","class CustomDistribution(rv_continuous):\n","    def _rvs(self,  size=None, random_state=None):\n","        return random_state.standard_normal(size)\n","temp = CustomDistribution(seed=1)\n","temp2 = temp()  # get a frozen version of the distribution\n","X_tilde = random(k, n, density=0.25, random_state=1, data_rvs=temp2.rvs)\n","C = random(p, k, density=0.25, random_state=1, data_rvs=temp2.rvs)"]},{"cell_type":"code","execution_count":94,"metadata":{"executionInfo":{"elapsed":7,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"2109w4xsOKax"},"outputs":[],"source":["test_mask = total_indices1.numel()"]},{"cell_type":"code","execution_count":95,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":7,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"17NDqxvdOKay","outputId":"6bde93d4-63fb-4eb9-f891-bdaffe07102a"},"outputs":[{"data":{"text/plain":["19717"]},"execution_count":95,"metadata":{},"output_type":"execute_result"}],"source":["total_indices1.numel()"]},{"cell_type":"markdown","metadata":{},"source":["# Extraction of csv files for visualization"]},{"cell_type":"markdown","metadata":{},"source":["### Feature Matrix"]},{"cell_type":"code","execution_count":96,"metadata":{},"outputs":[],"source":["if save_csv_files:\n","    # convert tensor to numpy array\n","    numpy_array = dataset[0].x.numpy()\n","    # save numpy array as CSV file\n","    np.savetxt(csv_path+'Feature_Matrix.csv', numpy_array, delimiter=',')"]},{"cell_type":"markdown","metadata":{},"source":["### Class Label Matrix"]},{"cell_type":"code","execution_count":97,"metadata":{},"outputs":[],"source":["def one_hot_encoded(x, class_count):\n","    return torch.eye(class_count)[x, :]\n","if save_csv_files:\n","    numpy_array = one_hot_encoded(dataset[0].y,NO_OF_CLASSES)# save the numpy array as a CSV file\n","    print(numpy_array)\n","    np.savetxt(csv_path+'Label_Matrix.csv', numpy_array, delimiter=',')"]},{"cell_type":"markdown","metadata":{},"source":["### Adjacency Matrix W"]},{"cell_type":"code","execution_count":98,"metadata":{},"outputs":[],"source":["if save_csv_files:\n","    # convert tensor to numpy array\n","    numpy_array = theta.numpy()\n","    # save numpy array as CSV file\n","    np.savetxt(csv_path+'Theta_Matrix.csv', numpy_array, delimiter=',')"]},{"cell_type":"code","execution_count":null,"metadata":{},"outputs":[],"source":[]},{"cell_type":"code","execution_count":null,"metadata":{},"outputs":[],"source":[]},{"cell_type":"code","execution_count":99,"metadata":{"executionInfo":{"elapsed":5,"status":"ok","timestamp":1706618431277,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"EPWYiXn7OKa0"},"outputs":[],"source":["#temp1 =int(labels.shape[0]*0.8)\n","#train_mask = labels[:temp1,]\n","\n","#test_mask ="]},{"cell_type":"code","execution_count":100,"metadata":{"executionInfo":{"elapsed":6,"status":"ok","timestamp":1706618431278,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"B89RXx11OKa1"},"outputs":[],"source":["def experiment(alpha_param,beta_param,gamma_param,lambda_param,delta_param,C,X_tilde,theta,X):\n","    p = X.shape[0]\n","    k = int(p*r_global)\n","    n = X.shape[1]\n","    ones = csr_matrix(np.ones((k,k)))\n","    ones = convertScipyToTensor(ones)\n","    ones = ones.to_dense()\n","    J = np.outer(np.ones(k), np.ones(k))/k\n","    J = csr_matrix(J)\n","    J = convertScipyToTensor(J)\n","    J = J.to_dense()\n","    zeros = csr_matrix(np.zeros((p,k)))\n","    zeros = convertScipyToTensor(zeros)\n","    zeros = zeros.to_dense()\n","    X_tilde = convertScipyToTensor(X_tilde)\n","    X_tilde = X_tilde.to_dense()\n","    C = convertScipyToTensor(C)\n","    C = C.to_dense()\n","    eye = torch.eye(k)\n","    try:\n","        theta = convertScipyToTensor(theta)\n","    except:\n","        theta = theta\n","    try:\n","        X = convertScipyToTensor(X)\n","        X = X.to_dense()\n","    except:\n","        X = X\n","\n","    def one_hot(x, class_count):\n","        return torch.eye(class_count)[x, :]\n","\n","    P = labels\n","    P = one_hot(P,NO_OF_CLASSES)\n","    P[train_mask,:]=0\n","    if(torch.cuda.is_available()):\n","        # print(\"yes\")\n","        X_tilde = X_tilde.cuda()\n","        C = C.cuda()\n","        theta = theta.cuda()\n","        X = X.cuda()\n","        J = J.cuda()\n","        P = P.cuda()\n","        zeros = zeros.cuda()\n","        ones = ones.cuda()\n","        eye = eye.cuda()\n","    def update(X_tilde,C,i):\n","        global L\n","        thetaC = theta@C\n","        CT = torch.transpose(C,0,1)\n","        X_tildeT = torch.transpose(X_tilde,0,1)\n","        CX_tilde = C@X_tilde\n","        t1 = CT@thetaC + J\n","        term_bracket = torch.linalg.pinv(t1)\n","        thetacX_tilde = thetaC@(X_tilde)\n","\n","        L = 1/k\n","\n","        t1 = -2*gamma_param*(thetaC@term_bracket)\n","        t2 = alpha_param*(CX_tilde-X)@(X_tildeT)\n","        t3 = 2*thetacX_tilde@(X_tildeT)\n","        t4 = lambda_param*(C@ones)\n","        t5 = 2*beta_param*(thetaC@CT@thetaC)\n","        t6 = delta_param*P@torch.transpose((CT@P),0,1)\n","        T2 = (t1+t2+t3+t4+t5+t6)/L\n","        Cnew = (C-T2).maximum(zeros)\n","        t1 = CT@thetaC*(2/alpha_param)\n","        t2 = CT@C\n","        t1 = torch.linalg.pinv(t1+t2)\n","        t1 = t1@CT\n","        t1 = t1@X\n","        X_tilde_new = t1\n","        Cnew[Cnew<thresh] = thresh\n","        for i in range(len(Cnew)):\n","            Cnew[i] = Cnew[i]/torch.linalg.norm(Cnew[i],1)\n","        for i in range(len(X_tilde_new)):\n","            X_tilde_new[i] = X_tilde_new[i]/torch.linalg.norm(X_tilde_new[i],1)\n","        return X_tilde_new,Cnew\n","\n","\n","    for i in tqdm(range(20)):\n","        X_tilde,C = update(X_tilde,C,i)\n","\n","    return X_tilde,C\n","\n"]},{"cell_type":"code","execution_count":101,"metadata":{"executionInfo":{"elapsed":5,"status":"ok","timestamp":1706618431278,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"ktw3SucLOKa3"},"outputs":[],"source":["class Net(torch.nn.Module):\n","    def __init__(self):\n","        super(Net, self).__init__()\n","        self.conv1 = GCNConv(X.shape[1], 64)\n","        self.conv2 = GCNConv(64, NO_OF_CLASSES)\n","\n","    def reset_parameters(self):\n","        self.conv1.reset_parameters()\n","        self.conv2.reset_parameters()\n","\n","    def forward(self, x, edge_index):\n","\n","        #print(\"Checking 1: x\", x.shape, \"Edge index:\", edge_index.shape)\n","        x = self.conv1(x, edge_index)\n","        #print(\"Checking 2: convolution done, new x:\", x.shape)\n","        x = F.relu(x)\n","        #print(\"Checking 3: x\", x.shape, \"training:\", self.training)\n","        x = F.dropout(x, training=self.training)\n","        #print(\"Checking 4: dropout done new x\", x.shape, \"Edge index:\", edge_index.shape)\n","        x = self.conv2(x, edge_index)\n","        #print(\"Checking 5: x\", x.shape)\n","\n","        return F.log_softmax(x, dim=1)"]},{"cell_type":"code","execution_count":102,"metadata":{"executionInfo":{"elapsed":5,"status":"ok","timestamp":1706618431278,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"5QV2he4UOKa5"},"outputs":[],"source":["from random import sample\n","from torch_geometric.utils import dense_to_sparse,homophily"]},{"cell_type":"code","execution_count":103,"metadata":{"executionInfo":{"elapsed":5,"status":"ok","timestamp":1706618431278,"user":{"displayName":"Archit Prasad Kane M.Tech., Computer Science & Engineering, IIT(BHU)","userId":"04470542112587312871"},"user_tz":-330},"id":"9v-h_G_KOKa6"},"outputs":[],"source":["def get_accuracy(C_0,L,X_t_0):\n","    gc.collect()\n","    global labels, NO_OF_CLASSES,k\n","    all_acc = []\n","    for i in [1,2]:\n","        C_0_new=np.zeros(C_0.shape)\n","        for i in range(C_0.shape[0]):\n","            C_0_new[i][np.argmax(C_0[i])]=1\n","        # print(\"C_0_new:\",C_0_new)\n","        # C_0_new=C_0\n","        from scipy import sparse\n","\n","        Lc=C_0_new.T@L@C_0_new\n","\n","        Wc=(-1*Lc)*(1-np.eye(Lc.shape[0]))\n","        Wc[Wc<0.1]=0\n","        Wc=sparse.csr_matrix(Wc)\n","        Wc = Wc.tocoo()\n","        row = torch.from_numpy(Wc.row).to(torch.long)\n","        col = torch.from_numpy(Wc.col).to(torch.long)\n","        edge_index_coarsen2 = torch.stack([row, col], dim=0)\n","\n","\n","        def one_hot(x, class_count):\n","            return torch.eye(class_count)[x, :]\n","\n","        device = torch.device('cpu')\n","\n","        Y = labels\n","\n","        Y = one_hot(Y,NO_OF_CLASSES)\n","        Y[train_mask, :] = 0\n","        # making Training dataset\n","        # Y[dataset[0].train_mask, :] = 0\n","\n","\n","\n","        P=np.linalg.pinv(C_0_new)\n","        labels_coarse = torch.argmax(torch.sparse.mm(torch.Tensor(P).double() , Y.double()).double() , 1)\n","\n","        Wc=Wc.toarray()\n","        adjtemp = torch.tensor(Wc)\n","        # edge_list_temp = dense_to_sparse(adjtemp)[0]\n","\n","        # print(\"Homophilic ratio : \" + str(homophily(edge_list_temp,labels_coarse,method='edge')))\n","        # number_of_edges = edge_list_temp.shape[1]\n","        # n = labels_coarse.shape[0]\n","        # sparsity = 2*number_of_edges/(n*(n-1))\n","        # print(\"Sparsity : \" + str(sparsity))\n","\n","  #\n","        # C2=np.linalg.pinv(C_0_new)\n","        model=Net().to(device)\n","        device = torch.device('cpu')\n","        lr=0.01\n","        decay=0.0001\n","        try:\n","            X=np.array(features.todense())\n","        except:\n","            X = np.array(features)\n","        #print(\"X:\",X.shape)\n","        optimizer = torch.optim.Adam(model.parameters(), lr=lr, weight_decay=decay)\n","        # criterion=torch.nn.CrossEntropyLoss()\n","        x=sample(range(0, int(k)), k)\n","\n","        from datetime import datetime\n","        Xt=P@X\n","        # Xt=X_t_0\n","        #########################################################  adding masks\n","        total_indices = torch.arange(k_global)\n","        shuffled_indices = torch.randperm(total_indices.numel())\n","        train_size = int(0.8 * total_indices.numel())\n","        train_indices = shuffled_indices[:train_size]\n","        val_size = int(0.2 * total_indices.numel())\n","        val_indices = shuffled_indices[train_size:train_size + val_size]\n","\n","        train_indices = shuffled_indices[:]\n","\n","        data = dataset[0].to(device)\n","\n","        coarsen_features = torch.Tensor(Xt).to(device)\n","        coarsen_train_labels = labels_coarse.to(device)\n","        coarsen_train_mask = train_indices.to(device)\n","        coarsen_val_labels = labels_coarse.to(device)\n","        coarsen_val_mask = val_indices.to(device)\n","        coarsen_edge = edge_index_coarsen2.to(device)\n","\n","        # print(\"Coarsen Data _trainpy\", data)\n","        # print(\"Coarsen feature _trainpy\", coarsen_features.shape)\n","        # print(\"Coarsen train_labels _trainpy\", coarsen_train_labels.shape)\n","        # print(\"Coarsen train_mask _trainpy\", coarsen_train_mask)\n","        # print(\"Coarsen train_mask _trainpy\", torch.sum(coarsen_train_mask))\n","        # print(\"Coarsen val_mask _trainpy\", torch.sum(coarsen_val_mask))\n","\n","\n","        # if args.normalize_features:\n","        #     coarsen_features = F.normalize(coarsen_features, p=1)\n","        #     data.x = F.normalize(data.x, p=1)\n","\n","        model.reset_parameters()\n","        optimizer = torch.optim.Adam(model.parameters(), lr=lr, weight_decay=0.0005)\n","        pathm = path +\"/Coarsening with Training, Tesing, Validation\"+\"/\"\n","        best_val_loss = float('inf')\n","        no_of_epochs = 500\n","        no_of_early_stopping = 10\n","        val_loss_history = []\n","        for epoch in range(no_of_epochs):\n","            model.train()\n","            optimizer.zero_grad()\n","            out = model(coarsen_features, coarsen_edge)\n","            loss = F.nll_loss(out[coarsen_train_mask], coarsen_train_labels[coarsen_train_mask])\n","            loss.backward()\n","            optimizer.step()\n","\n","            model.eval()\n","            pred = model(coarsen_features, coarsen_edge)\n","            val_loss = F.nll_loss(pred[coarsen_val_mask], coarsen_val_labels[coarsen_val_mask]).item()\n","\n","            if val_loss < best_val_loss and epoch > no_of_epochs // 2:\n","                best_val_loss = val_loss\n","                pathm = path +\"/Coarsening with Training, Tesing, Validation\"+\"/\"\n","                torch.save(model.state_dict(), pathm + 'checkpoint-best-acc.pkl')\n","\n","            val_loss_history.append(val_loss)\n","            if no_of_early_stopping  > 0 and epoch > no_of_epochs // 2:\n","                tmp = torch.Tensor(val_loss_history[-(no_of_early_stopping  + 1):-1])\n","                if val_loss > tmp.mean().item():\n","                    break\n","\n","\n","        model.load_state_dict(torch.load(pathm + 'checkpoint-best-acc.pkl'))\n","        model.eval()\n","        pred = model(data.x, data.edge_index).max(1)[1]\n","        #test_acc = int(pred[data.test_mask].eq(data.y[data.test_mask]).sum().item()) / int(data.test_mask.sum())\n","        test_acc = int(pred.eq(data.y).sum().item()) / int(test_mask)\n","        print(\"Test_acc\",f\"{test_acc:.4f}\")\n","        all_acc.append(test_acc)\n","\n","    print('ave_acc: {:.8f}'.format(np.mean(all_acc)), '+/- {:.8f}'.format(np.std(all_acc)))\n","    gc.collect()\n","    return np.mean(all_acc)\n","\n"]},{"cell_type":"code","execution_count":104,"metadata":{"colab":{"background_save":true,"base_uri":"https://localhost:8080/"},"id":"PCfnmklFOKa7"},"outputs":[{"name":"stdout","output_type":"stream","text":["\n","------\t Pubmed \t 0.05 \t 0 | 1 \t------\n","100.0 0.001 1.0 0.001 0.01\n"]},{"name":"stderr","output_type":"stream","text":[" 45%|████▌     | 9/20 [02:44<03:28, 18.96s/it]"]}],"source":["def getSparsityAndHomophily(C,theta):\n","    theta = C.T@theta@C\n","    adjtemp = -theta\n","    for i in range(adjtemp.shape[0]):\n","        adjtemp[i,i]=0\n","    adjtemp[adjtemp<0.01]=0\n","    temp = dense_to_sparse(adjtemp)\n","    edge_list_temp = temp[0]\n","    # ytemp = temp[1]\n","    # P = torch.linalg.pinv(C)\n","    # labels =\n","    # # print(edge_list)\n","    number_of_edges = edge_list_temp.shape[1]\n","    # n = adjtemp.shape[0]\n","\n","    # print(\"Homophilic ratio : \" + str(homophily(edge_list_temp,ytemp,method='node')))\n","    # sparsity = 2*number_of_edges/(n*(n-1))\n","    # print(\"Sparsity : \" + str(sparsity))\n","\n","\n","\n","def fitness_function(alpha_param,beta_param,gamma_param,lambda_param,delta_param):\n","    print(alpha_param,beta_param,gamma_param,lambda_param,delta_param)\n","    start = time.time()\n","    #alpha_param,beta_param,gamma_param,lambda_param,delta_param = temp_param\n","    X_tilde = random(k, n, density=0.15, random_state=1, data_rvs=temp2.rvs)\n","    C = random(p, k, density=0.15, random_state=1, data_rvs=temp2.rvs)\n","    X_t_0,C_0 = experiment(alpha_param,beta_param,gamma_param,lambda_param,delta_param,C,X_tilde,theta,X)\n","    L = theta\n","    #getSparsityAndHomophily(C_0,theta)\n","\n","    C_0 = C_0.cpu().detach().numpy()\n","    X_t_0 = X_t_0.cpu().detach().numpy()\n","    try:\n","        L = L.cpu().detach().numpy()\n","    except:\n","        L = L\n","    acc = get_accuracy(C_0,L,X_t_0)\n","    #readings_path \n","    end = time.time()\n","    print(\"Time Taken:\\t\",end-start)\n","    if save_csv_files:\n","        np.savetxt(readings_path+'//Coarsening_Matrix_With_Delta.csv', C_0, delimiter=',')\n","#here\n","\n","    return acc\n","\n","\n","\n","not_visited_set = set(map(tuple,not_visited_set))\n","\n","# ,0.001,0.01,0.1,1,10,100,1000\n","highest_acc = 0\n","for index,s in enumerate(not_visited_set):\n","    gc.collect()\n","    try:\n","      print(\"\\n------\\t\",dataset_global,\"\\t\",r_global,\"\\t\",index,\"|\",len(not_visited_set),\"\\t------\")\n","      alpha_param,beta_param,gamma_param,lambda_param,delta_param = s\n","\n","      acc = fitness_function(alpha_param,beta_param,gamma_param,lambda_param,delta_param)\n","      if acc >highest_acc:\n","          highest_acc =acc\n","      save_readings(alpha_param,beta_param,gamma_param,lambda_param,delta_param,r_global,k_global,acc)\n","      gc.collect()\n","    except Exception as e:\n","        print(e)\n","\n","\n"]},{"cell_type":"markdown","metadata":{},"source":[]},{"cell_type":"code","execution_count":null,"metadata":{"id":"H1oDxwRhOKa9"},"outputs":[],"source":[]}],"metadata":{"colab":{"name":"","version":""},"kernelspec":{"display_name":"Python 3","language":"python","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.10.6"}},"nbformat":4,"nbformat_minor":0}
