{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "7aef67b1",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Using backend: pytorch\n",
      "Intel(R) Extension for Scikit-learn* enabled (https://github.com/intel/scikit-learn-intelex)\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append('..')\n",
    "\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import os\n",
    "import math\n",
    "import torch\n",
    "import dgl\n",
    "import numpy_ml\n",
    "import torch.nn.functional as F\n",
    "import tensorflow.compat.v1 as tf\n",
    "import scipy\n",
    "import cupy as cp\n",
    "import cupyx\n",
    "\n",
    "from dgl import function as fn\n",
    "from dgl.base import DGLError\n",
    "from generate_mid_layer_feature import FeatureExtraction\n",
    "from sklearn.linear_model import LogisticRegression\n",
    "from scipy.special import softmax, log_softmax\n",
    "from numpy.linalg import inv, pinv\n",
    "from sklearn.preprocessing import OneHotEncoder\n",
    "from sklearn.metrics import log_loss\n",
    "from sklearn.preprocessing import LabelBinarizer\n",
    "from sklearn.utils import check_array\n",
    "from dataset import load_graph_dataset\n",
    "from sklearn.datasets import load_iris\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "from model_node_influence import NodeInfluenceSGC\n",
    "\n",
    "from model_softmax import SimplifiedGraphNeuralNetwork, fast_hess, fast_hess_cuda, fast_get_inv_hvp_cuda\n",
    "\n",
    "from matplotlib import pyplot as plt\n",
    "from scipy.linalg import cho_solve, cho_factor\n",
    "from model_edge_influence import EdgeInfluenceSGC, generate_remove_index_train\n",
    "from tqdm import tqdm\n",
    "import networkx as nx"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "32d8a19f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'/home/zizhang/Desktop/Projects/Project6_influence_function/graph_influence_function/experiments'"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "os.getcwd()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "67a6cc76",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Intel(R) Extension for Scikit-learn* enabled (https://github.com/intel/scikit-learn-intelex)\n"
     ]
    }
   ],
   "source": [
    "from sklearnex import patch_sklearn, config_context\n",
    "patch_sklearn()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "84907b0d",
   "metadata": {},
   "outputs": [],
   "source": [
    "data_set = 'cora'\n",
    "# l2_term = 0.01\n",
    "l2_term = 0.01\n",
    "# batch_edges = 1\n",
    "num_layer = 2\n",
    "\n",
    "# data_set = 'pubmed'\n",
    "# l2_term = 0.004\n",
    "# num_layer = 2\n",
    "\n",
    "# data_set = 'citeseer'\n",
    "# l2_term = 0.003\n",
    "# num_layer = 2\n",
    "\n",
    "# data_set = 'reddit'\n",
    "# l2_term = 0.99\n",
    "# num_layer = 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "12c21f96",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "  NumNodes: 2708\n",
      "  NumEdges: 10556\n",
      "  NumFeats: 1433\n",
      "  NumClasses: 7\n",
      "  NumTrainingSamples: 140\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n"
     ]
    }
   ],
   "source": [
    "graph, feat, labels, train_mask, val_mask, test_mask, number_classes = load_graph_dataset(data_set)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "25c35dc3",
   "metadata": {},
   "outputs": [],
   "source": [
    "feat0 = feat.clone()\n",
    "degs = graph.in_degrees().float().clamp(min = 1)\n",
    "norm = torch.pow(degs, -0.5)\n",
    "norm = norm.to(feat0.device).unsqueeze(1)\n",
    "\n",
    "for _ in range(num_layer):\n",
    "    feat0 = feat0 * norm\n",
    "    graph.ndata['h'] = feat0\n",
    "    graph.update_all(fn.copy_u('h', 'm'),\n",
    "                     fn.sum('m', 'h'))\n",
    "    feat0 = graph.ndata.pop('h')\n",
    "    feat0 = feat0 * norm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "eaf065ae",
   "metadata": {},
   "outputs": [],
   "source": [
    "train_x = feat0[train_mask].numpy().astype(np.float32)\n",
    "train_y = labels[train_mask].numpy().astype(np.float32)\n",
    "\n",
    "test_x = feat0[test_mask].numpy().astype(np.float32)\n",
    "test_y = labels[test_mask].numpy().astype(np.float32)\n",
    "\n",
    "val_x = feat0[val_mask].numpy().astype(np.float32)\n",
    "val_y = labels[val_mask].numpy().astype(np.float32)\n",
    "\n",
    "train_node_idx = torch.where(train_mask == 1)[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "fd1a7cd6",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "' Train Logistic Regression '"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "enc = OneHotEncoder(handle_unknown='ignore')\n",
    "enc.fit(train_y.reshape(-1, 1))\n",
    "\n",
    "one_hot_labels_train = enc.transform(train_y.reshape(-1, 1)).toarray()\n",
    "one_hot_labels_test = enc.transform(test_y.reshape(-1, 1)).toarray()\n",
    "one_hot_labels_val = enc.transform(val_y.reshape(-1, 1)).toarray()\n",
    "\"\"\" Train Logistic Regression \"\"\"\n",
    "# lr = SimplifiedGraphNeuralNetwork(l2_reg=l2_term, fit_intercept=True)\n",
    "# lr.fit(train_x, train_y, sample_weight=None, verbose=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "2c7e5064",
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_remove_index_train_all(from_indexes, to_indexes, train_mask, seed_val=10):\n",
    "    torch.manual_seed(seed_val)\n",
    "    train_index = torch.where(train_mask == 1)[0]\n",
    "    remove_from_list = []\n",
    "    remove_to_list = []\n",
    "    for i in tqdm(range(len(train_index))):\n",
    "        f_index = train_index[i]\n",
    "\n",
    "        to_index_list = torch.where(from_indexes == f_index)[0]\n",
    "        \n",
    "#         print(f_index)\n",
    "#         random_index = torch.randint(0, len(to_index_list), (1,))[0]\n",
    "        for to_index_e in to_index_list:\n",
    "#             print(to_index_list)\n",
    "#             print(to_index_e.item())\n",
    "#             j = to_index_list[to_index_e[0]]\n",
    "            j = to_index_e\n",
    "            t_index = to_indexes[j]\n",
    "\n",
    "            remove_from_list.append(f_index)\n",
    "            remove_to_list.append(t_index)\n",
    "\n",
    "    return torch.tensor(remove_from_list), torch.tensor(remove_to_list)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "300d906b",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████████████████████████████████| 140/140 [00:00<00:00, 20896.14it/s]\n"
     ]
    }
   ],
   "source": [
    "from_indexes, to_indexes = graph.edges()\n",
    "\n",
    "f_l, t_l = generate_remove_index_train_all(from_indexes, to_indexes, train_mask)\n",
    "f_l, t_l = from_indexes, to_indexes\n",
    "\n",
    "# acctual_influence_1 = []\n",
    "# acctual_influence_2 = []\n",
    "\n",
    "# predict_influence_1 = []\n",
    "# predict_influence_2 = []\n",
    "\n",
    "# df = pd.read_csv('result_data/' + data_set + '_edge_influence.csv', header = None)\n",
    "# df = df.loc[df[0] != 0]\n",
    "# f_l = torch.tensor(df[2].values.astype(int))\n",
    "# t_l = torch.tensor(df[3].values.astype(int))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "6972b1d8",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# split_side = int(len(f_l) / batch_edges)\n",
    "# total_edges = np.arange(len(f_l))\n",
    "# np.random.shuffle(total_edges)\n",
    "# new_index = np.array_split(total_edges, split_side)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "5b05a0e3",
   "metadata": {},
   "outputs": [],
   "source": [
    "changed_list = []\n",
    "changed_list_change = []"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "838dfe71",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|████████████████████████████████████████| 139/139 [00:00<00:00, 210.49it/s]\n"
     ]
    }
   ],
   "source": [
    "# convert to one-hot labels\n",
    "enc = OneHotEncoder(handle_unknown='ignore')\n",
    "enc.fit(train_y.reshape(-1, 1))\n",
    "one_hot_labels_train_orig = enc.transform(train_y.reshape(-1, 1)).toarray()\n",
    "\n",
    "one_hot_labels_val = enc.transform(val_y.reshape(-1, 1)).toarray()\n",
    "\n",
    "# train the original data\n",
    "# calculate the hessian matrix\n",
    "lr_origin = SimplifiedGraphNeuralNetwork(l2_reg=l2_term, fit_intercept=True)\n",
    "\n",
    "lr_origin.fit(train_x, train_y, sample_weight=None, verbose=False)\n",
    "\n",
    "logits_val_y_origin = val_x @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "\n",
    "logits_train_y_origin = train_x @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "\n",
    "ori_val_loss, ave_ori_val_loss = lr_origin.log_loss(logits_val_y_origin, one_hot_labels_val, l2_reg=True)\n",
    "\n",
    "# numpy_theoritic_loss = log_loss(val_y, softmax(logits_val_y_origin, axis=1))\n",
    "\n",
    "# assert np.allclose(numpy_theoritic_loss, ave_ori_val_loss)\n",
    "\n",
    "val_loss_total_grad_orig, val_loss_indiv_grad_orig = lr_origin.grad(val_x, \n",
    "                                                                    logits_val_y_origin,\n",
    "                                                                    one_hot_labels_val, l2_reg = True)\n",
    "\n",
    "hess = lr_origin.hess_cuda(train_x, logits_train_y_origin, l2_reg = True)\n",
    "\n",
    "\n",
    "###### write out hessian matrix\n",
    "\n",
    "# hess = cp.asnumpy(hess)\n",
    "\n",
    "# pd.DataFrame(hess).to_csv(\"reddit/hess.csv\", index = False)\n",
    "\n",
    "######\n",
    "\n",
    "\n",
    "loss_grad_hvp = fast_get_inv_hvp_cuda(hess, val_loss_total_grad_orig.T, cholskey=True)\n",
    "\n",
    "loss_grad_hvp = cp.asnumpy(loss_grad_hvp)\n",
    "del hess"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "67f2a7f9",
   "metadata": {},
   "outputs": [],
   "source": [
    "# # convert to one-hot labels\n",
    "# enc = OneHotEncoder(handle_unknown='ignore')\n",
    "# enc.fit(train_y.reshape(-1, 1))\n",
    "# one_hot_labels_train_orig = enc.transform(train_y.reshape(-1, 1)).toarray()\n",
    "\n",
    "# one_hot_labels_test = enc.transform(test_y.reshape(-1, 1)).toarray()\n",
    "\n",
    "# # train the original data\n",
    "# # calculate the hessian matrix\n",
    "# lr_origin = SimplifiedGraphNeuralNetwork(l2_reg=l2_term, fit_intercept=True)\n",
    "\n",
    "# lr_origin.fit(train_x, train_y, sample_weight=None, verbose=False)\n",
    "\n",
    "# logits_test_y_origin = test_x @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "\n",
    "# logits_train_y_origin = train_x @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "\n",
    "# ori_val_loss, ave_ori_val_loss = lr_origin.log_loss(logits_test_y_origin, one_hot_labels_test, l2_reg=True)\n",
    "\n",
    "# # numpy_theoritic_loss = log_loss(test_y, softmax(logits_test_y_origin, axis=1))\n",
    "\n",
    "# # assert np.allclose(numpy_theoritic_loss, ave_ori_val_loss)\n",
    "\n",
    "# val_loss_total_grad_orig, val_loss_indiv_grad_orig = lr_origin.grad(test_x, \n",
    "#                                                                     logits_test_y_origin,\n",
    "#                                                                     one_hot_labels_test, l2_reg = True)\n",
    "\n",
    "# hess = lr_origin.hess_cuda(train_x, logits_train_y_origin, l2_reg = True)\n",
    "\n",
    "# loss_grad_hvp = fast_get_inv_hvp_cuda(hess, val_loss_total_grad_orig.T, cholskey=True)\n",
    "\n",
    "# loss_grad_hvp = cp.asnumpy(loss_grad_hvp)\n",
    "# del hess"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "9b21fc08",
   "metadata": {},
   "source": [
    "##### comment here"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "1fe1198d",
   "metadata": {},
   "outputs": [],
   "source": [
    "# acctual_influence_1 = []\n",
    "# acctual_influence_2 = []\n",
    "\n",
    "# predict_influence_1 = []\n",
    "# predict_influence_2 = []\n",
    "\n",
    "# # for k in tqdm(range(len(train_node_idx))):\n",
    "# for k in tqdm(range(len(f_l))):\n",
    "# # for k in tqdm(range(len(new_index))):\n",
    "# #     eis = EdgeInfluenceSGC(graph=graph, feature=feat, from_index=f_l[new_index[k]], to_index=t_l[new_index[k]])\n",
    "# #     eis.remove_edges_sgc_from_influence()\n",
    "#     eis = EdgeInfluenceSGC(graph=graph, feature=feat, from_index=f_l[k], to_index=t_l[k])\n",
    "#     eis.remove_edges_sgc_from_influence()\n",
    "#     feat_removed1 = eis.calculate_modified_features()\n",
    "    \n",
    "# #     node_id = train_node_idx.numpy()[k]\n",
    "# #     nis = NodeInfluenceSGC(graph = graph, feature=feat, node_index=node_id)\n",
    "# #     nis.remove_edges_sgc()\n",
    "# #     feat_removed1 = nis.calculate_modified_features()\n",
    "\n",
    "#     extra_index = torch.unique(torch.where(feat0 != feat_removed1)[0])\n",
    "    \n",
    "    \n",
    "#     extra_index_train = torch.tensor(\n",
    "#         [extra_index[i] for i in range(len(extra_index)) if extra_index[i] in train_node_idx]).numpy()\n",
    "    \n",
    "#     extra_index_train_in_train = [\n",
    "#         np.where(train_node_idx.numpy() == extra_index_train[j])[0][0] for j in range(len(extra_index_train))]\n",
    "    \n",
    "#     if extra_index_train == []:\n",
    "#         predict_influence_1.append(0.0)\n",
    "#         acctual_influence_1.append(0.0)\n",
    "#         continue\n",
    "    \n",
    "#     feat_to_be_added = feat_removed1[extra_index_train].numpy()\n",
    "#     perturb_index = extra_index_train_in_train\n",
    "    \n",
    "    \n",
    "#     train_x_new = feat_to_be_added\n",
    "#     train_y_new = train_y[perturb_index]\n",
    "    \n",
    "#     train_x_orig = np.concatenate([train_x, train_x_new])\n",
    "#     train_y_orig = np.concatenate([train_y, train_y_new])\n",
    "    \n",
    "#     one_hot_labels_train_0 = enc.transform(train_y_orig.reshape(-1, 1)).toarray()\n",
    "#     logits_train_y_origin_0 = train_x_orig @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "\n",
    "#     train_total_grad_orig, train_indiv_grad_orig = lr_origin.grad(train_x_orig, \n",
    "#                                             logits_train_y_origin_0, \n",
    "#                                             one_hot_labels_train_0, l2_reg = True)\n",
    "    \n",
    "    \n",
    "#     pred_infl = train_indiv_grad_orig.dot(loss_grad_hvp)\n",
    "    \n",
    "    \n",
    "    \n",
    "    \n",
    "# #     weight_orig = np.ones(len(train_x_orig)) # 1...1...11\n",
    "    \n",
    "# #     weight_1 = np.ones(len(train_x_orig))\n",
    "# #     weight_1[len(train_x_orig) - len(perturb_index):] = 0 # 1...1...10\n",
    "    \n",
    "# #     weight_2 = np.ones(len(train_x_orig))\n",
    "# #     weight_2[len(train_x_orig) - len(perturb_index):] = 0 \n",
    "# #     weight_2[perturb_index] = 0 # 1...0...10\n",
    "    \n",
    "#     weight_3 = np.ones(len(train_x_orig))\n",
    "#     weight_3[perturb_index] = 0 # 1...0...11\n",
    "    \n",
    "# #     lr_new_1 = SimplifiedGraphNeuralNetwork(l2_reg=1.0, fit_intercept=True)\n",
    "# #     train_x_delete_1 = train_x_orig[weight_1 == 1]\n",
    "# #     train_y_delete_1 = train_y_orig[weight_1 == 1]\n",
    "    \n",
    "# #     assert(np.allclose(train_x_delete_1, train_x))\n",
    "# #     assert(np.allclose(train_y_delete_1, train_y))\n",
    "    \n",
    "# #     lr_new_1.fit(train_x_delete_1, train_y_delete_1)\n",
    "# #     logits_val_y_new_1 = val_x @ lr_new_1.model.coef_.T + lr_new_1.model.intercept_\n",
    "# #     new_ori_val_loss_1, _ = lr_new_1.log_loss(logits_val_y_new_1, one_hot_labels_val)\n",
    "    \n",
    "    \n",
    "    \n",
    "#     lr_new_2 = SimplifiedGraphNeuralNetwork(l2_reg=l2_term, fit_intercept=True)\n",
    "#     train_x_delete_2 = train_x_orig[weight_3 == 1]\n",
    "#     train_y_delete_2 = train_y_orig[weight_3 == 1]\n",
    "    \n",
    "#     lr_new_2.fit(train_x_delete_2, train_y_delete_2)\n",
    "#     logits_val_y_new_2 = val_x @ lr_new_2.model.coef_.T + lr_new_2.model.intercept_\n",
    "#     new_ori_val_loss_2, _ = lr_new_2.log_loss(logits_val_y_new_2, one_hot_labels_val, l2_reg = True)\n",
    "    \n",
    "#     predict_influence_1.append(np.sum(pred_infl[perturb_index]) - np.sum(pred_infl[len(train_x):]))\n",
    "#     acctual_influence_1.append(new_ori_val_loss_2 - ori_val_loss)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "917bea0d",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|█████████████████████████████████████| 13264/13264 [15:44<00:00, 14.04it/s]\n"
     ]
    }
   ],
   "source": [
    "acctual_influence_1 = []\n",
    "acctual_influence_2 = []\n",
    "\n",
    "predict_influence_1 = []\n",
    "predict_influence_2 = []\n",
    "\n",
    "# for k in tqdm(range(len(train_node_idx))):\n",
    "for k in tqdm(range(len(f_l))):\n",
    "# for k in tqdm(range(len(new_index))):\n",
    "#     eis = EdgeInfluenceSGC(graph=graph, feature=feat, from_index=f_l[new_index[k]], to_index=t_l[new_index[k]])\n",
    "#     eis.remove_edges_sgc_from_influence()\n",
    "    eis = EdgeInfluenceSGC(graph=graph, feature=feat, from_index=f_l[k], to_index=t_l[k])\n",
    "    eis.remove_edges_sgc_from_influence()\n",
    "    feat_removed1 = eis.calculate_modified_features()\n",
    "    \n",
    "#     node_id = train_node_idx.numpy()[k]\n",
    "#     nis = NodeInfluenceSGC(graph = graph, feature=feat, node_index=node_id)\n",
    "#     nis.remove_edges_sgc()\n",
    "#     feat_removed1 = nis.calculate_modified_features()\n",
    "\n",
    "    extra_index = torch.unique(torch.where(feat0 != feat_removed1)[0])\n",
    "    \n",
    "    \n",
    "    extra_index_train = torch.tensor(\n",
    "        [extra_index[i] for i in range(len(extra_index)) if extra_index[i] in train_node_idx]).numpy()\n",
    "    \n",
    "    extra_index_train_in_train = [\n",
    "        np.where(train_node_idx.numpy() == extra_index_train[j])[0][0] for j in range(len(extra_index_train))]\n",
    "    \n",
    "    if extra_index_train == []:\n",
    "        predict_influence_1.append(0.0)\n",
    "        acctual_influence_1.append(0.0)\n",
    "        continue\n",
    "#     print(extra_index_train)\n",
    "    feat_to_be_added = feat_removed1[extra_index_train].numpy()\n",
    "    perturb_index = extra_index_train_in_train\n",
    "    \n",
    "    if perturb_index == []:\n",
    "        predict_influence_1.append(0.0)\n",
    "        acctual_influence_1.append(0.0)\n",
    "        continue\n",
    "    \n",
    "    train_x_new = feat_to_be_added\n",
    "    train_y_new = train_y[perturb_index]\n",
    "    \n",
    "    train_x_orig = np.concatenate([train_x, train_x_new])\n",
    "    train_y_orig = np.concatenate([train_y, train_y_new])\n",
    "    \n",
    "    one_hot_labels_train_0 = enc.transform(train_y_orig.reshape(-1, 1)).toarray()\n",
    "    logits_train_y_origin_0 = train_x_orig @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "    \n",
    "    \n",
    "    train_x_orig_col_sum_before = train_x_orig\n",
    "    \n",
    "    \n",
    "    x1_train_before = train_x_orig[perturb_index]\n",
    "    y_logits_train_before = logits_train_y_origin_0[perturb_index]\n",
    "    y_one_hot_labels_train_before = one_hot_labels_train_0[perturb_index]\n",
    "    \n",
    "    l1 = lr_origin.grad_sum(x1_train_before, y_logits_train_before, \n",
    "                            y_one_hot_labels_train_before, l2_reg = True)\n",
    "    \n",
    "    \n",
    "    x1_train_after = train_x_orig[len(train_x):]\n",
    "    y_logits_train_after = logits_train_y_origin_0[len(train_x):]\n",
    "    y_one_hot_labels_train_after = one_hot_labels_train_0[len(train_x):]\n",
    "\n",
    "    l2 = lr_origin.grad_sum(x1_train_after, y_logits_train_after, \n",
    "                            y_one_hot_labels_train_after, l2_reg = True)\n",
    "    \n",
    "#     train_total_grad_orig, train_indiv_grad_orig = lr_origin.grad(train_x_orig, \n",
    "#                                             logits_train_y_origin_0, \n",
    "#                                             one_hot_labels_train_0, l2_reg = True)\n",
    "    \n",
    "    l1 = l1.dot(loss_grad_hvp)[0][0]\n",
    "    l2 = l2.dot(loss_grad_hvp)[0][0]\n",
    "#     pred_infl = train_indiv_grad_orig.dot(loss_grad_hvp)\n",
    "    \n",
    "    \n",
    "    \n",
    "    \n",
    "    weight_3 = np.ones(len(train_x_orig))\n",
    "    weight_3[perturb_index] = 0 # 1...0...11\n",
    "    \n",
    "    \n",
    "    lr_new_2 = SimplifiedGraphNeuralNetwork(l2_reg=l2_term, fit_intercept=True)\n",
    "    train_x_delete_2 = train_x_orig[weight_3 == 1]\n",
    "    train_y_delete_2 = train_y_orig[weight_3 == 1]\n",
    "    \n",
    "    lr_new_2.fit(train_x_delete_2, train_y_delete_2)\n",
    "    logits_val_y_new_2 = val_x @ lr_new_2.model.coef_.T + lr_new_2.model.intercept_\n",
    "    new_ori_val_loss_2, _ = lr_new_2.log_loss(logits_val_y_new_2, one_hot_labels_val, l2_reg = True)\n",
    "    \n",
    "#     predict_influence_1.append(np.sum(pred_infl[perturb_index]) - np.sum(pred_infl[len(train_x):]))\n",
    "    predict_influence_1.append(l1 - l2)\n",
    "    acctual_influence_1.append(new_ori_val_loss_2 - ori_val_loss)\n",
    "#     pd.DataFrame([predict_influence_1, acctual_influence_1]).T.to_csv('reddit/reddit_edge_influence.csv', header = None)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "1b6a81e7",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([], dtype=float32)"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "extra_index_train"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "4d27c03b",
   "metadata": {},
   "outputs": [],
   "source": [
    "# acctual_influence_1 = []\n",
    "# acctual_influence_2 = []\n",
    "\n",
    "# predict_influence_1 = []\n",
    "# predict_influence_2 = []\n",
    "\n",
    "# # for k in tqdm(range(len(train_node_idx))):\n",
    "# for k in tqdm(range(len(f_l))):\n",
    "\n",
    "#     eis = EdgeInfluenceSGC(graph=graph, feature=feat, from_index=f_l[k], to_index=t_l[k])\n",
    "#     eis.remove_edges_sgc()\n",
    "#     feat_removed1 = eis.calculate_modified_features()\n",
    "    \n",
    "# #     node_id = train_node_idx.numpy()[k]\n",
    "# #     nis = NodeInfluenceSGC(graph = graph, feature=feat, node_index=node_id)\n",
    "# #     nis.remove_edges_sgc()\n",
    "# #     feat_removed1 = nis.calculate_modified_features()\n",
    "\n",
    "#     extra_index = torch.unique(torch.where(feat0 != feat_removed1)[0])\n",
    "    \n",
    "    \n",
    "#     extra_index_train = torch.tensor(\n",
    "#         [extra_index[i] for i in range(len(extra_index)) if extra_index[i] in train_node_idx]).numpy()\n",
    "    \n",
    "#     extra_index_train_in_train = [\n",
    "#         np.where(train_node_idx.numpy() == extra_index_train[j])[0][0] for j in range(len(extra_index_train))]\n",
    "    \n",
    "#     if extra_index_train != []:\n",
    "#         predict_influence_1.append(0.0)\n",
    "#         acctual_influence_1.append(0.0)\n",
    "#         continue\n",
    "    \n",
    "#     feat_to_be_added = feat_removed1[extra_index_train].numpy()\n",
    "#     perturb_index = extra_index_train_in_train\n",
    "    \n",
    "    \n",
    "#     train_x_new = feat_to_be_added\n",
    "#     train_y_new = train_y[perturb_index]\n",
    "    \n",
    "#     train_x_orig = np.concatenate([train_x, train_x_new])\n",
    "#     train_y_orig = np.concatenate([train_y, train_y_new])\n",
    "    \n",
    "#     one_hot_labels_train_0 = enc.transform(train_y_orig.reshape(-1, 1)).toarray()\n",
    "#     logits_train_y_origin_0 = train_x_orig @ lr_origin.model.coef_.T + lr_origin.model.intercept_\n",
    "\n",
    "#     train_total_grad_orig, train_indiv_grad_orig = lr_origin.grad(train_x_orig, \n",
    "#                                             logits_train_y_origin_0, \n",
    "#                                             one_hot_labels_train_0, l2_reg = True)\n",
    "    \n",
    "    \n",
    "#     pred_infl = train_indiv_grad_orig.dot(loss_grad_hvp)\n",
    "    \n",
    "    \n",
    "    \n",
    "    \n",
    "# #     weight_orig = np.ones(len(train_x_orig)) # 1...1...11\n",
    "    \n",
    "# #     weight_1 = np.ones(len(train_x_orig))\n",
    "# #     weight_1[len(train_x_orig) - len(perturb_index):] = 0 # 1...1...10\n",
    "    \n",
    "# #     weight_2 = np.ones(len(train_x_orig))\n",
    "# #     weight_2[len(train_x_orig) - len(perturb_index):] = 0 \n",
    "# #     weight_2[perturb_index] = 0 # 1...0...10\n",
    "    \n",
    "#     weight_3 = np.ones(len(train_x_orig))\n",
    "#     weight_3[perturb_index] = 0 # 1...0...11\n",
    "    \n",
    "# #     lr_new_1 = SimplifiedGraphNeuralNetwork(l2_reg=1.0, fit_intercept=True)\n",
    "# #     train_x_delete_1 = train_x_orig[weight_1 == 1]\n",
    "# #     train_y_delete_1 = train_y_orig[weight_1 == 1]\n",
    "    \n",
    "# #     assert(np.allclose(train_x_delete_1, train_x))\n",
    "# #     assert(np.allclose(train_y_delete_1, train_y))\n",
    "    \n",
    "# #     lr_new_1.fit(train_x_delete_1, train_y_delete_1)\n",
    "# #     logits_test_y_new_1 = test_x @ lr_new_1.model.coef_.T + lr_new_1.model.intercept_\n",
    "# #     new_ori_val_loss_1, _ = lr_new_1.log_loss(logits_test_y_new_1, one_hot_labels_test)\n",
    "    \n",
    "    \n",
    "    \n",
    "#     lr_new_2 = SimplifiedGraphNeuralNetwork(l2_reg=l2_term, fit_intercept=True)\n",
    "#     train_x_delete_2 = train_x_orig[weight_3 == 1]\n",
    "#     train_y_delete_2 = train_y_orig[weight_3 == 1]\n",
    "    \n",
    "#     lr_new_2.fit(train_x_delete_2, train_y_delete_2)\n",
    "#     logits_test_y_new_2 = test_x @ lr_new_2.model.coef_.T + lr_new_2.model.intercept_\n",
    "#     new_ori_val_loss_2, _ = lr_new_2.log_loss(logits_test_y_new_2, one_hot_labels_test, l2_reg = True)\n",
    "    \n",
    "#     predict_influence_1.append(np.sum(pred_infl[perturb_index]) - np.sum(pred_infl[len(train_x):]))\n",
    "#     acctual_influence_1.append(new_ori_val_loss_2 - ori_val_loss)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "20717907",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZwAAAEKCAYAAAAmfuNnAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/MnkTPAAAACXBIWXMAAAsTAAALEwEAmpwYAAA0cElEQVR4nO3dd3hUBdbH8e9J6BB6L6FJr0IABQsqKqCiWHbRXbsirr7u6q4Cxt6x7OquFXvBSo2IiLAqroqCKEkICb0GEmoSCOnn/ePe6BAmYYBpyZzP8+SZuWXu/HKTzMlt54qqYowxxgRaVKgDGGOMiQxWcIwxxgSFFRxjjDFBYQXHGGNMUFjBMcYYExRWcIwxxgRFSAuOiLwhIpkikuwxrrGIfCkia9zHRuW8dqSIpInIWhGZFLzUxhhjjkWot3DeAkaWGTcJWKSqXYBF7vAhRCQaeAEYBfQELheRnoGNaowx5niEtOCo6mJgT5nRFwJvu8/fBi7y8tLBwFpVXa+qBcCH7uuMMcaEqWqhDuBFC1XdDqCq20WkuZd52gBbPIa3AkO8LUxExgPjAerWrTuwe/fufo5rjDFVT0FRCdv2HWR/fhEFO9buUtVmx7vMcCw4vhAv47z26FHVqcBUgLi4OF22bFkgcxljTKVWXKK888NGnvoijZbAxFHduXpox03+WHY4FpwMEWnlbt20AjK9zLMVaOcx3BZID0o6Y4ypotZm5jBxRhI/b9rL6V2b8djFfWjTsDZX+2n54VhwEoCrgSfcxzle5lkKdBGRjsA2YBxwRdASGmNMFVJYXMIr36zj34vWUqdmNP/8Qz/GntgGEW87k45dSAuOiHwADAeaishW4H6cQvOxiFwPbAYuc+dtDbymqqNVtUhEbgW+AKKBN1R1ZSi+B2OMqcySt2Vx5/REVm3P5ry+rXjggl40i6kZkPcKacFR1cvLmXSWl3nTgdEew/OAeQGKZowxVVpeYTHPLlzDq9+up0ndGrxy5UDO7dUyoO8ZjrvUjDHGBNCP63czaWYSG3Yd4I9x7bj7vB40qF094O9rBccYYyJETl4hT85P490lm2jXuDbTbhjCsBOaBu39reAYY0wE+Cotk/iZSWzPzuO6YR35x7ldqVMjuCXACo4xxlRhew8U8PDcFGb+so0uzesx4+ahDIj12qIy4KzgGGNMFaSqfJa0nfvnrCTrYCG3ndWFW87oTM1q0SHLZAXHGGOqmIzsPO6dncyClAz6tm3AezcMoUer+qGOZQXHGGOqClXl42VbeOSzVRQUlXD36O5cN6wj1aJDfWMAhxUcY4ypAjbvzmXyrES+W7ubIR0bM+WSvnRoWjfUsQ5hBccYYyqx4hLlre838vQXaURHCY9c1JsrBscSFeXftjT+YAXHGGMqqdUZOdw1PZFft+zjzO7NeXRsb1o1qB3qWOWygmOMMZVMQVEJL3+zjv/8dw31albjuXH9GdOvtd+bbfqbFRxjjKlEVmzZx8QZiaTuyGFMv9bcf0FPmtQLTLNNf7OCY4wxlcDBgmKeXbiaV79dT7OYmrx2VRwjerYIdayjYgXHGGPC3A/rdjN5ZiIbd+dy+eBYJo/uTv1agW+26W9WcIwxJkxl5xXyxOepvP/jZto3qcP7Nw5haOfgNdv0Nys4xhgThv6bmsHdM5PJzMnjxlM7csfZ3ahdI3RtafzBCo4xxoSR3fvzeWhuCnN+TadbixhevnIg/ds1DHUsv7CCY4wxYUBVSViRzoOfppCTV8hfz+rCLWecQI1q4dGWxh/CsuCISDfgI49RnYD7VPVZj3mGA3OADe6omar6UJAiGmOM32zPOsg9s5JZlJpJv3YNefKSvnRrGRPqWH4XlgVHVdOA/gAiEg1sA2Z5mfVbVT0/iNGMMcZvSkqUD5du4fF5qygsKeGe83pw7bCORIdhWxp/CMuCU8ZZwDpV3RTqIMYY4y8bdx1g0sxElqzfw8mdmvDEJX1o3yS8mm36W2UoOOOAD8qZdrKIrADSgX+o6srgxTLGmKNXVFzCG99t4JkFq6kRHcXjF/dh3KB2Yd+Wxh/CuuCISA1gDDDZy+TlQHtV3S8io4HZQBcvyxgPjAeIjY0NXFhjjDmC1B3ZTJyeyIqtWYzo0ZxHLupDywa1Qh0raMK64ACjgOWqmlF2gqpmezyfJyIvikhTVd1VZr6pwFSAuLg4DXRgY4wpK7+omBe+WseLX62lQe3q/OfyEzm/b6uI2KrxFO4F53LK2Z0mIi2BDFVVERkMRAG7gxnOGGOO5JfNe5k4I5HVGfsZe2Ib7j2/J43r1gh1rJAI24IjInWAs4GbPMZNAFDVl4FLgZtFpAg4CIxTVduCMcaEhdyCIp5ZsJo3vttAy/q1eOOaOM7sXrmabfpb2BYcVc0FmpQZ97LH8+eB54OdyxhjjuT7tbuYNDOJzXty+fNJsUwc2Z2YSths09/CtuAYY0xlk3WwkMfnreLDpVvo2LQuH40/iSGdmhz5hRHCCo4xxvjBgpU7uGd2Mrv253PT6Z24fURXalWv3M02/c0KjjHGHIdd+/N5IGElcxO3071lDK9dHUfftg1DHSssWcExxphjoKrM/nUbD36aQm5+MXec3ZUJp3euUs02/c0KjjHGHKX0fQeJn5XEV2k7OTHWabbZpUXVa7bpb1ZwjDHGRyUlyrSfNjPl81SKS5T7zu/J1UM7VNlmm/5mBccYY3ywYdcBJs5I5KcNezjlhKY8fnEf2jWuE+pYlYoVHGOMqUBRcQmv/W8D//pyNTWqRfHkJX25LK5txLWl8QcrOMYYU46U9GzumrGC5G3ZnNurBQ9f2Jvm9SOn2aa/WcExxpgy8ouKef6/a3np63U0rFOdF/80gFG9W9pWzXGygmOMMR5+3uQ021ybuZ+LB7Th3vN60ihCm236mxUcY4wBDuQX8fSCNN76fiOtG9TmrWsHMbxb81DHqlKs4BhjIt63a3YyeWYSW/ce5MqT2jNxVHfq1bSPR3+zNWqMiVhZuYU8Oi+Fj5dtpVPTunx808kM7tg41LGqLCs4xpiIND95B/fOSWbPgQL+Mrwzt53VxZptBpgVHGNMRNmZ4zTb/CxpOz1b1efNawbRu02DUMeKCFZwjDERQVWZuXwbD81N4WBBMXee243xp3WierQ12wyWIxYcEbkMmK+qOSJyDzAAeERVlwc8nTHG+MHWvbncPSuZxat3MrB9I6Zc0pcTmtcLdayI48sWzr2q+omInAKcCzwNvAQMCWgyY4w5TiUlyns/bmLK56ko8OCYXlx5UnuirNlmSPhScIrdx/OAl1R1jog8ELhIDhHZCOS471+kqnFlpgvwHDAayAWusa0uY0ypdTv3M2lGIks37uW0rs14bGxv2jayZpuh5EvB2SYirwAjgCkiUhMI1k7PM1R1VznTRgFd3K8h2FaXMQYoLC7h1W/X8+zCNdSuHs3Tl/XjkgFtrC1NGPCl4PwBGAk8rar7RKQVcGdgY/nkQuAdVVVgiYg0FJFWqro91MGMMaGRvC2LiTMSWZmezeg+LXlgTC+ax1izzXDhS8FpBXymqvkiMhzoC7wTyFAuBRaIiAKvqOrUMtPbAFs8hre64w4pOCIyHhgPEBsbG7i0xpiQySss5t+L1vDK4vU0qlODl/88gJG9W4U6linDl4IzA4gTkROA14EE4H2cYyeBNExV00WkOfCliKSq6mKP6d62j/WwEU6hmgoQFxd32HRjTOW2dOMeJs5IZP3OA1w2sC33nNeTBnWqhzqW8cKXglOiqkUicjHwrKr+R0R+CXQwVU13HzNFZBYwGPAsOFuBdh7DbYH0QOcyxoSH/flFPDU/lXeWbKJ1g9q8c91gTuvaLNSxTAV8KTiFInI5cBVwgTsuoP8+iEhdIMq99qcucA7wUJnZEoBbReRDnJMFsuz4jTGR4ZvVO7l7ZhLpWQe5+uQO3HluN+pas82w58tP6FpgAvCoqm4QkY7Ae4GNRQtglntWSTXgfVWdLyITAFT1ZWAezm69tTinRV8b4EzGmBDbl1vAQ3NTmLl8G52b1WX6hJMZ2N6abVYW4pzkdYSZRGoAXd3BNFUtDGiqAImLi9Nly5aFOoYx5hjMS9rOfXOS2ZdbyITTO3PrmSdYs80gEZGfy14LeSx8aW0zHHgb2IhzoL6diFxd5gC+McYERGZ2HvfNWcn8lTvo3aY+b183mF6trdlmZeTLLrVngHNUNQ1ARLoCHwADAxnMGBPZVJVPft7KI3NTyC8qYdKo7txwSkeqWbPNSsuXglO9tNgAqOpqEbFzDo0xAbNlTy6TZybxv7W7GNyhMU9c0odOzazZZmXnS8FZJiKvA++6w38Cfg5cJGNMpCouUd75YSNPzk8jSuDhi3rzp8Gx1myzivCl4NwM3ALchnMMZzHwYiBDGWMiz9rMHO6ansjyzfsY3q0Zj47tQ5uGtUMdy/jREQuOquYD/3S/jDHGrwqLS3jlm3X8e9Fa6tSM5l9/7MdF/a3ZZlVUbsERkSS8tIoppap9A5LIGBMxkrZmcef0FaTuyOG8vq14cEwvmtarGepYJkAq2sI5P2gpjDERJa+wmGcXruHVb9fTpG4Npl45kHN6tQx1LBNg5RYcVd0UzCDGmMjw4/rdTJqZxIZdBxg3qB2TR/egQW078TUSWPMhY0xQ5OQVMmV+Ku8t2Uy7xrWZdsMQhp3QNNSxTBBZwTHGBNxXqZnEz0pie3Ye15/Skb+f05U6NezjJ9LYT9wYEzB7DhTw8NwUZv2yjS7N6zHj5qEMiG0U6lgmRHzppTYMeABo784vgKpqp8BGM8ZUVqrKZ0nbuX/OSrIOFnLbWV245YzO1KxmzTYjmS9bOK8Dt+N0FygObBxjTGWXkZ3HPbOT+TIlg75tG/DeDUPo0ap+qGOZMOBLwclS1c8DnsQYU6mpKh8v28Ijn62ioKiE+NE9uHZYB2u2aX7jS8H5SkSeAmYC+aUjVXV5wFIZYyqVzbtzmTQzke/X7WZIx8ZMuaQvHZrWDXUsE2Z8KThD3EfPm+8ocKb/4xhjKpPiEuXN7zbw9II0qkVF8djYPowb1M6abRqvfOmldkYwghhjKpfVGU6zzV+37OPM7s15dGxvWjWwZpumfBX1Uvuzqr4nInd4m66qAWvmKSLtgHeAlkAJMFVVnyszz3BgDrDBHTVTVR8KVCZjjKOgqISXvl7H81+tIaZWdZ4b158x/Vpbs01zRBVt4ZTugI0JRpAyioC/q+pyEYkBfhaRL1U1pcx836qq9XwzJkhWbNnHxBmJpO7I4YJ+rXnggp40sWabxkcV9VJ7xX18MHhxfnvv7cB293mOiKwC2gBlC44xJggOFhTzr4Wree3b9TSPqcVrV8UxomeLUMcylUzYdxoQkQ7AicCPXiafLCIrgHTgH6q60svrxwPjAWJjYwOY1Jiq6Yd1u5k0M5FNu3O5Ykgsk0Z1p34ta7Zpjl5YFxwRqQfMAP6mqtllJi8H2qvqfhEZDcwGupRdhqpOBaYCxMXFlXt/H2PMobLzCnl8Xiof/LSZ9k3q8P6NQxja2ZptmmMXtgVHRKrjFJtpqjqz7HTPAqSq80TkRRFpqqq7gpnTmKpoYUoG98xOJjMnj/GndeL2EV2pXcPa0pjj40svtRbAY0BrVR0lIj2Bk1X19UCFEud0l9eBVeWdDSciLYEMVVURGQxEAbsDlcmYSLB7fz4PfppCwop0urWI4eUrB9K/XcNQxzJVhC9bOG8BbwLx7vBq4COcghAow4ArgSQR+dUddzcQC6CqLwOXAjeLSBFwEBinqrbLzJhjoKokrEjngYSV7M8v4vYRXbl5eGdqVLO2NMZ/fCk4TVX1YxGZDKCqRSIS0Caeqvo/nK7UFc3zPPB8IHMYEwm2Zx3knlnJLErNpH+7hjx5aV+6tgjF1RCmqvPl35cDItIEp50NInISkBXQVMYYv4uPhz59nEeAkhJl2o+bOPufi/lu3S7uOa8HM24eelTFpuwyjamIL1s4dwAJQGcR+Q5ohrM7yxhTScTHw2OPOc+TkyFHD5DZIZEl6/cwtHMTnri4L7FN6hzXMgEefdSPoU2V40svteUicjrQDWc3V5qqFgY8mTHGbxIS3CdSQv1BG0goXE1MehRTLunDH+LaHVNbmt+W6TFsBcdUxJez1C4uM6qriGQBSaqaGZhYxhh/GjMG0jKyaTIqkZqtsmhLC2bc0ZsW9Wsd1zJLt2xKh42piC+71K4HTga+coeHA0twCs9DqvpugLIZY/wgv6iYJsPX0aZ4LeRXZ5icyLuPtTruZpulWzMJCU6xsa0bcyS+FJwSoIeqZsBv1+W8hHOfnMWAFRxjwtTyzXuZOD2RNZn7GXtiG+47vyeN6tbw2/IffdQKjfGdLwWnQ2mxcWUCXVV1j4jYsRxjwlBuQRHPLFjNG99toGX9Wrx5zSDO6N481LFMhPOl4HwrInOBT9zhS4DFIlIX2BeoYMaYoxcfD6/P3UWNYYlE1T/In0+KZeLI7sRU0GwzPt52i5ng8KXg3IJTZIbhnKX2DjDDvarf7gZqTJi48+5C3vhlFTGjtlC4py6Z005Co5sQc1H5r7FTm00wSSR1g4mLi9Nly5aFOoYxfhMfD6++CtGxO6h+cjJSu4DsnzqR9V0XtCia3r0hKan81/fpc+iZZkea30QmEflZVeOOdzm+nhY9BWiOs4UjgKpq/eN9c2PM0SvdBbZ3L2zfm0/jESup2WM7BZkx7P5kEAUZDX6b90inKtupzSaYfNml9iRwgaquCnQYY0zFft8FptTtuY3Wl6QQVb2YvYu7kv1jZyj5vVvV0KFH3j1mpzabYPKl4GRYsTEm9BISYMoUiI45SJNzk6jdeSd52xqy+/O+FO0+vP9ZdtlbFpbDTm02weJLwVkmIh/h3FEzv3Skt5uiGWMC47LLYPp0pV7/zTQavgoE9izsSc7yDqDeL+C03WMm3PhScOoDucA5HuMUsIJjTIA5hQaqNdpPiyuSqNVuDwc3NmXP/D4UZR3ebHPoUGfLxnaPmXDkS/POa4MRxBjzu9+O1UgJ9QdvoMEpq9HiKHbN68uBpLaUvV1UtWpw111WZEx48+UstVo4/dR6Ab91+lPV6wKYy5iIVdrirHqzbJqMXkHNltnkprVgz5e9KT7gvdmmFRtTGfhyA7Z3gZbAucA3QFsgJ5ChjIk08fFOoREBootpeGoara7+H9Xq5bNz1gB2zo7zWmxq1oS777ZiYyoHXwrOCap6L3BAVd8GzgP6BDYWiMhIEUkTkbUiMsnLdBGRf7vTE0VkQKAzGeNvpYWm9Gr/mm320Oqa/9Fg6FoOpLQh/fXTyF3dqtzX//3vVmxM5eHLSQOlDTr3iUhvYAfQIWCJABGJBl4Azga2AktFJEFVUzxmGwV0cb+G8HsHa2MqBc+7A0j1IhqelkbMwI0UZ9cm4+NB5G3w3myzTRto1MhODDCVjy8FZ6qINALuxbnVdD3gvoCmgsHAWlVdDyAiHwIXAp4F50LgHben2xIRaSgirVR1e4CzGXPcPItNrQ47aTIyiWoNDpL9c3v2Le6OFhz+p1mjBvzjH1ZkTOXly1lqr7lPvwE6BTbOb9oAWzyGt3L41ou3edoAhxQcERkPjAeIjY31e1BjjsawYfD9987zqJqFNDorhXp9tlK4uy473juZ/G2ND3tN7dpw++1WaEzl58tZajVxukV38JxfVR8KXCy8XclWtsuoL/OgqlOBqeA07zz+aMYcm5gY2L/feV6763Yan72S6DoFZP3QmX3fdYHi6MNeM3QofPddkIMaEyC+7FKbA2QBP+PRaSDAtgLtPIbbAunHMI8xYaFtW6fYRNXNo/HZK6nbbQcFGfXZOf3QZpul6tWDHDsX1FQxvhSctqo6MuBJDrUU6CIiHYFtwDjgijLzJAC3usd3hgBZdvzGhJv4eHjySSgqUur23kqjM1c5zTa/6Ub2T50OabZZyk5zNlWVLwXnexHpo6pBu0uGqhaJyK3AF0A08IaqrhSRCe70l4F5wGhgLU7rHeuIYMJG6X1qdu6E6Pq5NB+ZRO2Ou8jb2shptrmnXqgjGhN05d6ATUSScI6JVMM59Xg9zi610vvh9A1WSH+xG7CZYPC8hUDMgI00PD0NgH3fdCdneXu8H378nd0EzYSbYNyA7fzjXbgxkSghAao13k+TUYnUaruXg+ubsfuL3hRnH95ss1kz6NLl9zPXwLo8m6qr3IKjqpsAROQkYKWq5rjDMUBPYFNQEhpTiRQWlyA919P63DWUFEaz67N+HEhug7etmltugeefd56X3sXTLuY0VZkvx3BeAjzbxhzwMs6YiJaQAJ8szGJDs0SyO2aTm9qSPQt7UVJOs806deAcjxt+2E3QTCTwpeCIehzoUdUSEfHldcZUefHx8N77xezvsIZ6g9ZTklmD3QsGcNBL/zMRmDwZsrIgI8N57Y8/WqExkcOXwrFeRG7D2aoB+AvOCQTGRLT4eHjm7T00GZVITJMD7E9sy97/9qQkv/ph8w4cCPfd5+wyi4+HF15wxicnO49WdEwk8KVb9ARgKM71MKUtZsYHMpQx4W5/fhEfr0umxZ9+QKJLyPhoMLs/73dYsYmOdq6rWbbs95MBEhIOXVbZYWOqKl96qWXiXHhpjAG+Wb2Tu2cmUdjhIDnLOrBvcTe0sBoDB0LHjs4toUtNnHj41suYMb9v2ZQOGxMJ7FiMMT7al1vAQ3NTmLl8Gy1q12Vo7skUNmpMajeoXx+ys6FrV2eLpqIzzkrH2VlpJtKUe+FnVWQXfppj9eAb25mWmkxRdCEj2nRm2t0nkJsTTZ06MHr0oVs11prGVDX+uvDTl2M4xkSszOw8LnzyZ95cvZyczFrsen8Y2z7vRm6O09k5Nxf++99DX2PHZIzxrtxdaiJyR0UvVNV/+j+OMeFBVfnk5608MjeF/QdL2PtNd7J/6ggaBb2d62hyc53HM888dAvHjskY411Fx3Bi3MduwCCc7swAFwCLAxnKmFDasieXu2cl8e2aXQzu0JhzGvXhr8/XA3UKzE03OV8LFjgXb5ae6mzHZIyp2BGP4YjIAuCSMq1tPgnBLQuOmx3DMRUpLlHe+WEjT32RhgCTRnXnT0PaExUlJCQcWmCMiSTBaN5ZKhYo8BguwLn7pzFVxtrMHO6ansjyzfsY3q0Zj47tQ5uGtX+bPmaMFRpjjpcvBedd4CcRmYVzu4KxwDsBTWVMkBQWl/DKN+v496K11KkZzT//0I+xJ7ZBpOJbCBhjjp4vF34+KiKfA6e6o65V1V8CG8uYwEvamsWd01eQuiOH8/q24sExvWhar2aoYxlTZfl64WcdIFtV3xSRZiLSUVU3BDKYMYGSV1jMswvX8Oq362lStwavXDmQc3u1DHUsY6q8IxYcEbkfiMM5W+1NoDrwHjAssNGM8b+fNuxh4oxENuw6wB/j2nH3eT1oUPvwZpvGGP/zZQtnLHAisBxAVdPdM9UCQkSewjn1ugBYh7MLb5+X+TYCOUAxUOSPMyhM1ZWTV8iT89N4d8km2jWuzbQbhjDshKahjmVMRPGl4BSoqoqIAohI3QBn+hKYrKpFIjIFmAxMLGfeM1R1V4DzmEruq9RM4mclsT07j+tP6cjfz+lKnRrWRtCYYPPlr+5jEXkFaCgiNwLXAa8FKpCqLvAYXAJcGqj3MlXbngMFPDw3hVm/bKNL83rMuHkoA2IbhTqWMRHLl7PUnhaRs4FsnOM496nqlwFP5rgO+Ki8aMACd8vrFVWd6m0mERmPe/+e2NjYgIQ04UVV+SxpO/fPWUnWwUJuO6sLt5zRmZrVokMdzZiI5stJA1NUdSLOrq6y446JiCwEvJ0WFK+qc9x54oEiYFo5ixnmHk9qDnwpIqmqeljLHbcQTQWn08CxZjaVQ0Z2HvfMTubLlAz6tm3AezcMoUer+qGOZYzBt11qZ3P4MZRRXsb5TFVHVDRdRK4GzgfO0nJ676hquvuY6V6UOhjr8RaxVJWPlm7h0XmrKCgqIX50D64d1oFq0dYQ3ZhwUVG36JuBvwCdRSTRY1IM8H2gAonISJxidrqq5pYzT10gSlVz3OfnAA8FKpMJb5t2H2DyzCS+X7ebIR0bM+WSvnRoGuhzW4wxR6uiLZz3gc+Bx4FJHuNzVHVPADM9D9TE2U0GsERVJ4hIa+A1VR0NtABmudOrAe+r6vwAZjJhqLhEefO7DTy9II1qUVE8NrYP4wa1IyrK2tIYE47KLTiqmgVkichzwB7PbtEiMkRVfwxEIFU9oZzx6cBo9/l6oF8g3t9UDmk7crhrRiIrtuzjrO7NeWRsb1o1qH3kFxpjQsaXYzgvAQM8hg94GWdMUBQUlfDi12t54au1xNSqznPj+jOmX2trtmlMJeBLwRHPA/eqWiIidtWcCboVW/Zx1/RE0jJyuLB/a+47vydNrNmmMZWGL4VjvYjchrNVA86JBOsDF8mYQx0sKOafX6bx+v820DymFq9dFceIni1CHcsYc5R8KTgTgH8D9+BcbLkI90JKYwLth3W7mTQzkU27c7liSCyTRnWnfi1rtmlMZeRLp4FMYFwQshjzm+y8Qh6fl8oHP22mfZM6vH/jEIZ2tmabxlRmFV2Hc5eqPiki/8HZsjmEqt4W0GQmYi1alUH8rGQyc/K48dSO3HF2N2rXsLY0xlR2FW3hrHIflwUjiDG79+fz4KcpJKxIp1uLGF6+ciD92zUMdSxjjJ9UdB3Op+7j28GLYyKRqpKwIp0HP00hJ6+Q20d05ebhnalRzdrSGFOVVLRL7VO87EorpapjApLIRJTtWQe5d3YyC1dl0r9dQ568tC9dWwTs/n7GmBCqaJfa0+7jxTidnd9zhy8HNgYwk4kAJSXKh0u38Pi8VRSWlHDPeT24dlhHoq0tjTFVVkW71L4BEJGHVfU0j0mfioh1ZTbHbOOuA0yamciS9XsY2rkJT1zcl9gmdUIdyxgTYL5ch9NMRDq5/csQkY5As8DGMlVRUXEJb3y3gWcWrKZGdBRPXNyHPw5qZ21pjIkQvhSc24GvRaS0u0AH4KaAJTJVUuqObCZOT2TF1ixG9GjBIxf1pmWDWqGOZYwJIl8u/JwvIl2A7u6oVFXND2wsU1XkFxXz4lfrePHrtdSvVZ3nrziR8/q0sq0aYyKQL7eYrgPcAbRX1RtFpIuIdFPVuYGPZyqzXzbvZeKMRFZn7GfsiW247/yeNKpbI9SxjDEh4ssutTeBn4GT3eGtwCeAFRzjVW5BEc8sWM0b322gZf1avHnNIM7o3jzUsYwxIeZLwemsqn8UkcsBVPWg2P4QU47v1+5i0swkNu/J5c8nxTJxZHdirNmmMQbfCk6BiNTGvQhURDoDdgzHHCLrYCGPz1vFh0u30LFpXT4afxJDOjUJdSxjTBjxpeDcD8wH2onINGAYcE2gAonIA8CNwE531N2qOs/LfCOB54Bo4DVVfSJQmUzFFqzcwT2zk9l9oIAJp3fmbyO6UKu6Nds0xhyqwoIjIlFAI5xuAycBAvxVVXcFONe/VPXp8iaKSDTwAnA2zjGlpSKSoKopAc5lPOzan88DCSuZm7id7i1jeP3qQfRp2yDUsYwxYarCguPeTvpWVf0Y+CxImXwxGFjrcTHqh8CFgBWcIFBVZv+6jQc/TSE3v5i/n92VCcM7Uz3amm0aY8rnyy61L0XkH8BHwIHSkaq6J2Cp4FYRuQrn1gh/V9W9Zaa3AbZ4DG8FhnhbkIiMx71DaWxsbACiRpb0fQeJn5XEV2k7GRDbkCmX9KWLNds0xvjAl4Jznft4i8c4BTod65uKyEKchqBlxQMvAQ+77/Ew8IxHht8W4eW1Xjtbq+pUYCpAXFxcud2vTcVKSpRpP21myuepFJco91/Qk6tO7mDNNo0xPvOl00BHf7+pqo7wZT4ReRXv1/tsBdp5DLcF0v0QzXixfud+Js1I4qeNezjlhKY8fnEf2jW2ZpvGmKPjS6eBWsBfgFNwtiK+BV5W1bxABBKRVqq63R0cCyR7mW0p0MVtJLoNGAdcEYg8kayouISp367n2YVrqFUtiicv7ctlA9taWxpXfDwkJMCYMfDoo6FOY0z482WX2jtADvAfd/hy4F3gsgBlelJE+uMUt424jUJFpDXO6c+jVbVIRG4FvsA5LfoNVV0ZoDwRaWV6FhNnJJK8LZtze7Xg4Qt707y+NdssFR8Pjz3mPE92/yWyomNMxUS14sMaIrJCVfsdaVxlEBcXp8uWLQt1jLCWV1jMf/67hpe/WU+jOjV4+MJejOrTKtSxwk6fPr8XGoDevSEpKXR5jAkkEflZVeOOdzm+bOH8IiInqeoS942HAN8d7xub8PPzpj3cNT2RdTsPcMmAttx7fg8a1rFmm96MGXNowRljN1w35oh8KThDgKtEZLM7HAusEpEkQFW1b8DSmaA4kF/EU1+k8fYPG2ndoDZvXzeY07vaPfYqUrr7zI7hGOM7X3apta9ouqpu8muiALJdaodbvHonk2cmkZ51kKtOas+dI7tTr6Yv/4cYYyJF0HapVaaCYnyXlVvIw5+lMP3nrXRqVpePbzqZQR0ahzqWMaYKs39lI9D85O3cO2clew4UcMsZnfm/M63ZpjEm8KzgRJDMnDzun7OSz5N30Kt1fd66dhC9WluzTWNMcFjBiQCqyozl23h4bgoHC4u5a2Q3bjy1kzXbNMYElRWcKm7r3lzunpXM4tU7GdShEU9c0pfOzeqFOpYxJgJZwamiSkqUd5dsYsr8VAAeurAXfx7SnihrtmmMCRErOFXQ2sz9TJqRyLJNezmtazMeG9ubto2s2aYxJrSs4FQhhcUlTF28nucWraF29WievqwflwxoY802jTFhwQpOFZG8LYu7pieSsj2b0X1a8sCYXjSPsWabxpjwYQWnkssrLOa5RWuYung9jevW4OU/D2Bkb2u2aYwJP1ZwKrGlG/cwcXoi63cd4LKBbbnnvJ40qFM91LGMMcYrKziV0P78Ip6cn8o7P2yibaPavHv9YE7tYs02jTHhzQpOJfN1Wibxs5JJzzrINUM7cOe53ahrzTaNMZWAfVJVEnsPFPDwZynMXL6NE5rXY/qEoQxs3yjUsYwxxmdWcMKcqjIvaQf3JySzL7eQ2848gVvOPIGa1azZpjGmcgm7giMiHwHd3MGGwD5V7e9lvo1ADlAMFPnjXg3hJjM7j3tmJ7MgJYM+bRrwznVD6Nm6fqhjGWPMMQm7gqOqfyx9LiLPAFkVzH6Gqu4KfKrgUlU+WbaVhz9LoaCohMmjunP9KR2pZs02jTGVWNgVnFLiXB7/B+DMUGcJpi17cpk8M4n/rd3F4I6NeeLiPnSyZpvGmCogbAsOcCqQoaprypmuwAIRUeAVVZ0avGj+V1yivP39Rp76Io3oKOGRi3pzxeBYa7ZpjKkyQlJwRGQh0NLLpHhVneM+vxz4oILFDFPVdBFpDnwpIqmqutjLe40HxgPExsYeZ/LAWJORw8QZiSzfvI8zujXj0bF9aN2wdqhjGWOMX4mqhjrDYUSkGrANGKiqW32Y/wFgv6o+XdF8cXFxumzZMv+E9IPC4hJe/nod//nvWurWjOb+C3pxYf/W1mzTGBNWRORnf5yYFa671EYAqeUVGxGpC0Spao77/BzgoWAGPF6JW/dx1/REUnfkcH7fVjwwphdN69UMdSxjjAmYcC044yizO01EWgOvqepooAUwy90SqAa8r6rzg57yGOQVFvOvL1fz6rfraRZTk1eviuPsni1CHcsYYwIuLAuOql7jZVw6MNp9vh7oF+RYx23J+t1MnpnEhl0HGDeoHZNH96BBbWu2aYyJDGFZcKqanLxCnvg8lWk/bqZd49pMu2EIw05oGupYxhgTVFZwAuyr1EzunpVERnYeN5zSkTvO6UqdGrbajTGRxz75AmTPgQIe+nQls39Np0vzerx481BOjLVmm8aYyGUFx89UlbmJ23kgYSVZBwv561ld+MsZna3ZpjEm4lnB8aOM7DziZyWzcFUG/do2YNqNQ+je0pptGmMMWMHxC1Xlo6VbeHTeKgqLS4gf3YPrTulItLWlMcaY31jBOU6bdh9g0owkfli/m5M6NeaJi/vSoWndUMcyxpiwYwXnGBWXKG9+t4GnF6RRPSqKx8b2YdygdtZs0xhjymEF5xik7cjhrhmJrNiyj7O6N+eRsb1p1cCabRpjTEWs4ByFgqISXvx6LS98tZaYWtV5blx/xvSzZpvGGOMLKzg++nXLPiZOTyQtI4cL+7fm/gt60bhujVDHMsaYSsMKzhEcLCjmn1+m8fr/NtA8phavXx3HWT2s2aYxxhwtKzgV+H7dLibNSGLznlyuGBLLpFHdqV/Lmm0aY8yxsILjRXZeIY/PS+WDnzbTvkkdPrjxJE7u3CTUsYwxplKzglPGwpQM4mcnsTMnn5tO68TfRnSldg1rS2OMMcfLCo5r9/58Hvw0hYQV6XRvGcOrV8XRt23DUMcyxpgqI+ILjqqSsCKdBxJWsj+/iDvO7sqE0ztTo1pUqKMZY0yVEtEFZ3vWQe6Zlcyi1Ez6t2vIk5f2pWuLmFDHMsaYKikiC05JifLB0s08Pi+V4hLl3vN7cs3QDtZs0xhjAigk+41E5DIRWSkiJSISV2baZBFZKyJpInJuOa9vLCJfisga99HnO5tt3HWAK15bQvysZPq1a8AXfzuN662zszHGBFyoDlQkAxcDiz1HikhPYBzQCxgJvCgi3k4RmwQsUtUuwCJ3+Ih27s/n3GcXszI9mymX9OG964cQ26TO8XwfxhhjfBSSXWqqugrw1oPsQuBDVc0HNojIWmAw8IOX+Ya7z98GvgYmHul9d2TlcVXXZjxyUW9a1K91zPmNMcYcvXA7htMGWOIxvNUdV1YLVd0OoKrbRaR5eQsUkfHAeHcw/7WrByW/5q+0gdMU2BXqED6wnP5TGTKC5fS3ypKzmz8WErCCIyILgZZeJsWr6pzyXuZlnB5PDlWdCkx1My1T1bgjvCTkLKd/VYaclSEjWE5/q0w5/bGcgBUcVR1xDC/bCrTzGG4LpHuZL0NEWrlbN62AzGPJaIwxJnjC7erGBGCciNQUkY5AF+Cncua72n1+NVDeFpMxxpgwEarToseKyFbgZOAzEfkCQFVXAh8DKcB84BZVLXZf85rHKdRPAGeLyBrgbHfYF1P9+G0EkuX0r8qQszJkBMvpbxGVU1SP6xCJMcYY45Nw26VmjDGmirKCY4wxJiiqXMEJZduc48j8kYj86n5tFJFfy5lvo4gkufP55TTFoyEiD4jINo+so8uZb6S7jteKiE9dIPyY8SkRSRWRRBGZJSINy5kvJOvySOtGHP92pyeKyIBgZfPI0E5EvhKRVe7f0l+9zDNcRLI8fhfuC3ZON0eFP8cwWZ/dPNbTryKSLSJ/KzNPSNaniLwhIpkikuwxzqfPwGP6O1fVKvUF9MC5SOlrIM5jfE9gBVAT6AisA6K9vP5JYJL7fBIwJcj5nwHuK2faRqBpCNftA8A/jjBPtLtuOwE13HXeM4gZzwGquc+nlPfzC8W69GXdAKOBz3GuSTsJ+DEEP+dWwAD3eQyw2kvO4cDcYGc72p9jOKxPL78DO4D24bA+gdOAAUCyx7gjfgYe6995ldvCUdVVqprmZdJvbXNUdQNQ2jbH23xvu8/fBi4KSFAvxOn18wfgg2C9ZwAMBtaq6npVLQA+xFmnQaGqC1S1yB1cgnMtV7jwZd1cCLyjjiVAQ/das6BR1e2qutx9ngOswnvHj8og5OuzjLOAdaq6KYQZfqOqi4E9ZUb78hl4TH/nVa7gVKANsMVj2Ke2OUC5bXMC4FQgQ1XXlDNdgQUi8rPbsicUbnV3TbxRzqa2r+s5GK7D+e/Wm1CsS1/WTTitP0SkA3Ai8KOXySeLyAoR+VxEegU32W+O9HMMq/WJ05y4vH8ow2F9gm+fgce0XsOtl5pPJEza5hwNHzNfTsVbN8NUNV2c3nFfikiq+x9KUHICLwEP46y3h3F2/11XdhFeXuvX9ezLuhSReKAImFbOYgK+Lr3wZd2E9PfUk4jUA2YAf1PV7DKTl+PsFtrvHsubjXOhdrAd6ecYTuuzBjAGmOxlcrisT18d03qtlAVHK2HbnCNlFpFqOLdsGFjBMtLdx0wRmYWzWevXD0lf162IvArM9TLJ1/V8zHxYl1cD5wNnqbvD2csyAr4uvfBl3QR8/flCRKrjFJtpqjqz7HTPAqSq80TkRRFpqqpBbUTpw88xLNanaxSwXFUzyk4Il/Xp8uUz8JjWayTtUgv3tjkjgFRV3eptoojUFZGY0uc4B8eTvc0bKGX2fY8t5/2XAl1EpKP7H904nHUaFCIyEudWFWNUNbeceUK1Ln1ZNwnAVe7ZVScBWaW7N4LFPZb4OrBKVf9Zzjwt3fkQkcE4nyW7g5fS559jyNenh3L3YITD+vTgy2fgsf2dB/usiEB/4XwQbgXygQzgC49p8ThnVqQBozzGv4Z7RhvQBOembmvcx8ZByv0WMKHMuNbAPPd5J5wzQVYAK3F2HwV73b4LJAGJ7i9Xq7I53eHROGc2rQt2TpyTQbYAv7pfL4fTuvS2boAJpT97nF0VL7jTk/A40zKIGU/B2T2S6LEeR5fJeau77lbgnJwxNAQ5vf4cw219ujnq4BSQBh7jQr4+cQrgdqDQ/dy8vrzPQH/8nVtrG2OMMUERSbvUjDHGhJAVHGOMMUFhBccYY0xQWMExxhgTFFZwjDHGBIUVHFPluZ14hx7nMvYfxbxvicilx/N+/iIi3x/l/GGT3VQ9VnBMJBgOHFfBqaxUNSK/bxOerOCYSklEZrsNG1d6Nm1079Gx3G2CuMhtPjkBuN29z8ipZf+LL916EZF67muWi3OPlSN2vxWRq9xmpitE5F2PSaeJyPcisr70vcpbvoh0EOfeM6+6388CEantThvkLv8Hce71k+yOj3aHl7rTbyonX+n3NlxEvhaR6eLcL2ha6ZXtFXxvZ4nIL27WN0Skpjv+CRFJcd/3aXfcZSKS7K6HQLcIMpVVKK66tS/7Ot4vfr/6uTZOO5MmQDOcLgMdy8zzAB738cHp6nCpx/B+97EaUN993hSna4F4zlMmQy+crhVNy7zfW8AnOP/Q9cRp417u8oEOOI1G+7vTPgb+7D5Pxr3qHHgC974lwHjgHvd5TWBZ6fddJmPp9zYcyMLpeRUF/ACc4mX+t4BLgVruuuzqjn8H+BvQ2P2eS9dLQ/cxCWjjOc6+7Kvsl23hmMrqNhEpbQPSDqc33knAYnXud4Sqlr3Px5EI8JiIJAILcdqtt6hg/jOB6eo2WCzzfrNVtURVUzyWUdHyN6jqr+7zn4EO4tytNEZVS4/DvO+x/HNweoT9inPrgCYcubvwT6q6VVVLcNrVdKhg3m5uptXu8Ns4N+vKBvKA10TkYqC0X913wFsiciPOzbmMOUyl7BZtIpuIDMdpdnqyquaKyNc4/5ELvrWeL8LdnezuVqrhjv8TzlbSQFUtFJGN7nLLjVLB++WXme9Iy/ecvxhny62iXV4C/J+qflHBPBVlKqbiv3+v762qRW5zybNwGjbeCpypqhNEZAhwHvCriPRX1VA1nzRhyrZwTGXUANjrFpvuOFs24OwmOl2cbuCISGN3fA7OrZJLbeT320BcCFT3WG6mWwzOANofIcci4A8i0qTM+1WU2+flq+peIMftcgzOB3ypL4CbxbmNACLS1e2Y7C+pOFtZJ7jDVwLfiHOPnAaqOg9nF1t/9/07q+qPqnofsItDW9cbA9gWjqmc5gMT3F1TaTi71VDVne4JBDNFJArnPh5nA58C092D9P8HvArMEZGfcIrGAXe504BPRWQZzi6n1IpCqOpKEXkU54O4GPgFuKaClxzV8l3XA6+KyAHga5zjMOB0OO8ALHe30nbix9uhq2qeiFwLfCLOvZqWAi/jHMOZIyKlW5S3uy95SkS6uOMW4XQ9NuYQ1i3amDAmIvVUtfRMs0k4t4T4a4hjGXNMbAvHmPB2nohMxvlb3UTFW1DGhDXbwjHGGBMUdtKAMcaYoLCCY4wxJiis4BhjjAkKKzjGGGOCwgqOMcaYoPh/LqXXgegzKM8AAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Number of edges in consider 13264\n"
     ]
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "low_limit = -10\n",
    "up_limit = 10\n",
    "x = np.linspace(low_limit, up_limit)\n",
    "# x = np.linspace(-0.2, 0.15)\n",
    "plt.plot(x, x)\n",
    "plt.scatter(acctual_influence_1, predict_influence_1, s = 10, color='blue')\n",
    "plt.xlabel('actual change in loss')\n",
    "plt.ylabel('predicted change in loss')\n",
    "# plt.title('Influence function on edges of Cora dataset perturb edges:' + str(batch_edges))\n",
    "# plt.title('Influence function on Complete Node of Citeseer dataset')\n",
    "plt.ylim(low_limit, up_limit)\n",
    "plt.xlim(low_limit, up_limit)\n",
    "# plt.title('Influence function on Iris dataset')\n",
    "plt.show()\n",
    "print('Number of edges in consider %d'% len(f_l))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "544cd674",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([], dtype=float32)"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "extra_index_train"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "ae4d8bc9",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([ 0.00818464, -0.0257164 , -0.04345373, ...,  0.02806713,\n",
       "       -0.02714676, -0.0080532 ])"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.array(acctual_influence_1)[np.array(acctual_influence_1) !=0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "ba34e6ac",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "SpearmanrResult(correlation=0.645962574971654, pvalue=0.0)"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "scipy.stats.spearmanr(np.array(acctual_influence_1)[np.array(acctual_influence_1) !=0], np.array(predict_influence_1)[np.array(predict_influence_1) !=0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "f7a6ad37",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "SpearmanrResult(correlation=0.5967557747249025, pvalue=0.0)"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "scipy.stats.spearmanr(acctual_influence_1, predict_influence_1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "33d25abe",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame([acctual_influence_1, predict_influence_1, f_l.numpy().astype(int), t_l.numpy().astype(int)]).T\n",
    "df.columns = ['acctual_influence', 'predict_influence', 'from_edges', 'to_edges']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "bac1c355",
   "metadata": {},
   "outputs": [],
   "source": [
    "df.to_csv('result_data/' + data_set + '_edge_influence_002.csv', header = None, index = False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "61b3a5cc",
   "metadata": {},
   "outputs": [],
   "source": [
    "# import pandas as pd\n",
    "# df = pd.read_csv('result_data/pubmed_edge_influence.csv', header = None)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "68f7f35e",
   "metadata": {},
   "outputs": [],
   "source": [
    "# import matplotlib.pyplot as plt\n",
    "# import numpy as np\n",
    "# low_limit = -10\n",
    "# up_limit = 10\n",
    "# x = np.linspace(low_limit, up_limit)\n",
    "# # x = np.linspace(-0.2, 0.15)\n",
    "# plt.plot(x, x)\n",
    "# plt.scatter(df[0], df[1], s = 10, color='blue')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "6d20e840",
   "metadata": {},
   "outputs": [],
   "source": [
    "# g = dgl.graph(([1, 1, 2, 3, 4], [0, 2, 0, 4, 2]))\n",
    "# g.edata['w'] = torch.arange(10).view(5, 2)\n",
    "# sg, inverse_indices = dgl.khop_in_subgraph(g, 0, k=2)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
