{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "f7bfcb4f",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Using backend: pytorch\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append('..')\n",
    "\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "from pyvis.network import Network\n",
    "from tqdm import tqdm\n",
    "import os\n",
    "import dgl\n",
    "import torch\n",
    "import networkx as nx\n",
    "from dataset import load_graph_dataset"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "bf120cee",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "  NumNodes: 2708\n",
      "  NumEdges: 10556\n",
      "  NumFeats: 1433\n",
      "  NumClasses: 7\n",
      "  NumTrainingSamples: 140\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n"
     ]
    }
   ],
   "source": [
    "graph, feat, labels, train_mask, val_mask, test_mask, number_classes = load_graph_dataset('cora')\n",
    "train_mask = train_mask.numpy()\n",
    "train_node_index= np.where(train_mask == 1)[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 160,
   "id": "9a084daa",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([4, 4, 4, ..., 4, 3, 3])"
      ]
     },
     "execution_count": 160,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "labels.numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "095c4c7f",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "ef7d817c",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_node_feature = pd.read_csv('node_feature_2/cora.csv')\n",
    "df_node_preprocessed = df_node_feature.drop(columns = ['predicted influence'])\n",
    "df_node_preprocessed['node_id'] = train_node_index\n",
    "df_node_preprocessed = df_node_preprocessed.sort_values(['actual influence'], ascending = False)\n",
    "df_node_preprocessed.index = range(len(df_node_preprocessed))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "39d20157",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge = pd.read_csv('edge_feature/cora_edge_influence_001.csv', header = None)\n",
    "df_edge.columns = ['actual_influence', 'predicted_influence', 'from_edges', 'to_edges']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "905cb5cf",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_influence = df_edge.groupby(['from_edges', 'to_edges']).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "3f9bc877",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_actual_edge_influence(df_edge):\n",
    "    new_infl = []\n",
    "    df_edge_copy = df_edge.copy()\n",
    "    for i in tqdm(range(len(df_edge))):\n",
    "        f = df_edge.loc[i, ['from_edges']].values[0]\n",
    "        t = df_edge.loc[i, ['to_edges']].values[0]\n",
    "\n",
    "        act_1 = df_edge[(df_edge['from_edges'] == f) & (df_edge['to_edges'] == t)].actual_influence.values[0]\n",
    "        act_2 = df_edge[(df_edge['from_edges'] == t) & (df_edge['to_edges'] == f)].actual_influence.values[0]\n",
    "        new_infl.append((act_1 + act_2))\n",
    "    return new_infl"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "fa7ddec7",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|████████████████████████████████████| 13264/13264 [00:16<00:00, 821.68it/s]\n"
     ]
    }
   ],
   "source": [
    "new_infl = []\n",
    "df_edge_copy = df_edge.copy()\n",
    "for i in tqdm(range(len(df_edge))):\n",
    "    f = df_edge.loc[i, ['from_edges']].values[0]\n",
    "    t = df_edge.loc[i, ['to_edges']].values[0]\n",
    "    \n",
    "    act_1 = df_edge[(df_edge['from_edges'] == f) & (df_edge['to_edges'] == t)].actual_influence.values[0]\n",
    "    act_2 = df_edge[(df_edge['from_edges'] == t) & (df_edge['to_edges'] == f)].actual_influence.values[0]\n",
    "    new_infl.append((act_1 + act_2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "dab5cc40",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_copy['influence'] = new_infl\n",
    "df_edge_preprocessed = df_edge_copy.drop(columns=['actual_influence', 'predicted_influence'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "0cb4092e",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_preprocessed = df_edge_preprocessed.sort_values(['influence'], ascending=False)\n",
    "df_edge_preprocessed.index = range(len(df_edge_preprocessed))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "id": "2968689c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# df_edge_preprocessed_0 = df_edge_preprocessed.copy()\n",
    "# for i in tqdm(range(len(df_edge_preprocessed))):\n",
    "#     src = df_edge_preprocessed.loc[i, ['from_edges']].values[0].astype(int)\n",
    "#     dst = df_edge_preprocessed.loc[i, ['to_edges']].values[0].astype(int)\n",
    "#     index_temp = df_edge_preprocessed[(df_edge_preprocessed['from_edges'] == dst) & \n",
    "#                      (df_edge_preprocessed['to_edges'] == src)].index[0]\n",
    "#     if index_temp:\n",
    "#         df_edge_preprocessed_0 = df_edge_preprocessed_0.drop([index_temp])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "id": "22e33a50",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_preprocessed_0 = df_edge_preprocessed.copy()\n",
    "df_edge_preprocessed_0 = df_edge_preprocessed_0.drop_duplicates(subset = ['influence'])\n",
    "df_edge_preprocessed_0['from_edges'] = df_edge_preprocessed_0['from_edges'].astype(int).values\n",
    "df_edge_preprocessed_0['to_edges'] = df_edge_preprocessed_0['to_edges'].astype(int).values\n",
    "df_edge_preprocessed_0.index = range(len(df_edge_preprocessed_0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "id": "60ee1ac5",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_edge_preprocessed[(df_edge_preprocessed['from_edges'] == dst) & \n",
    "                     (df_edge_preprocessed['to_edges'] == src)].index[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "id": "b2d26630",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>actual influence</th>\n",
       "      <th>node_id</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>15.530282</td>\n",
       "      <td>2079</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>14.665039</td>\n",
       "      <td>1879</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>13.158551</td>\n",
       "      <td>2367</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>12.499614</td>\n",
       "      <td>1716</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>12.212362</td>\n",
       "      <td>1793</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>135</th>\n",
       "      <td>-1.322061</td>\n",
       "      <td>2209</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>136</th>\n",
       "      <td>-1.688545</td>\n",
       "      <td>2658</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>137</th>\n",
       "      <td>-1.981031</td>\n",
       "      <td>542</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>138</th>\n",
       "      <td>-3.037878</td>\n",
       "      <td>138</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>139</th>\n",
       "      <td>-4.082214</td>\n",
       "      <td>432</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>140 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     actual influence  node_id\n",
       "0           15.530282     2079\n",
       "1           14.665039     1879\n",
       "2           13.158551     2367\n",
       "3           12.499614     1716\n",
       "4           12.212362     1793\n",
       "..                ...      ...\n",
       "135         -1.322061     2209\n",
       "136         -1.688545     2658\n",
       "137         -1.981031      542\n",
       "138         -3.037878      138\n",
       "139         -4.082214      432\n",
       "\n",
       "[140 rows x 2 columns]"
      ]
     },
     "execution_count": 62,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_node_preprocessed"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "id": "1b3f4567",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>from_edges</th>\n",
       "      <th>to_edges</th>\n",
       "      <th>influence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1281</td>\n",
       "      <td>2014</td>\n",
       "      <td>2.605583</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1152</td>\n",
       "      <td>554</td>\n",
       "      <td>2.116021</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1082</td>\n",
       "      <td>1082</td>\n",
       "      <td>1.797256</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>741</td>\n",
       "      <td>741</td>\n",
       "      <td>1.566844</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>2297</td>\n",
       "      <td>1857</td>\n",
       "      <td>1.551643</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13259</th>\n",
       "      <td>1857</td>\n",
       "      <td>1857</td>\n",
       "      <td>-0.993066</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13260</th>\n",
       "      <td>2367</td>\n",
       "      <td>2367</td>\n",
       "      <td>-1.024753</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13261</th>\n",
       "      <td>79</td>\n",
       "      <td>79</td>\n",
       "      <td>-1.777368</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13262</th>\n",
       "      <td>554</td>\n",
       "      <td>554</td>\n",
       "      <td>-2.366645</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13263</th>\n",
       "      <td>1049</td>\n",
       "      <td>1049</td>\n",
       "      <td>-2.785466</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5566 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       from_edges  to_edges  influence\n",
       "0            1281      2014   2.605583\n",
       "2            1152       554   2.116021\n",
       "4            1082      1082   1.797256\n",
       "5             741       741   1.566844\n",
       "6            2297      1857   1.551643\n",
       "...           ...       ...        ...\n",
       "13259        1857      1857  -0.993066\n",
       "13260        2367      2367  -1.024753\n",
       "13261          79        79  -1.777368\n",
       "13262         554       554  -2.366645\n",
       "13263        1049      1049  -2.785466\n",
       "\n",
       "[5566 rows x 3 columns]"
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_edge_preprocessed_0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "id": "1e22b402",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>actual influence</th>\n",
       "      <th>node_id</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>9.570093</td>\n",
       "      <td>1281</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    actual influence  node_id\n",
       "14          9.570093     1281"
      ]
     },
     "execution_count": 102,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_node_preprocessed.loc[df_node_preprocessed['node_id'] == 1281]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 263,
   "id": "e14e7b26",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_preprocessed_1 = df_edge_preprocessed_0.copy()\n",
    "f_node_infl = []\n",
    "t_node_infl = []\n",
    "\n",
    "node_ids_temp = df_node_preprocessed['node_id'].values\n",
    "for i in range(len(df_edge_preprocessed_0)):\n",
    "    f_temp_node = df_edge_preprocessed_0.loc[i, ['from_edges']].values[0].astype(int)\n",
    "    t_temp_node = df_edge_preprocessed_0.loc[i, ['to_edges']].values[0].astype(int)\n",
    "\n",
    "    \n",
    "    if f_temp_node in node_ids_temp:\n",
    "        temp_infl_node = df_node_preprocessed.loc[df_node_preprocessed['node_id'] == f_temp_node, \n",
    "                                                  ['actual influence']].values[0][0]\n",
    "        \n",
    "        f_current_node_infl = temp_infl_node\n",
    "    else:\n",
    "        f_current_node_infl = 0.0\n",
    "    \n",
    "    f_node_infl.append(f_current_node_infl)\n",
    "\n",
    "\n",
    "    if t_temp_node in node_ids_temp:\n",
    "        temp_infl_node = df_node_preprocessed.loc[df_node_preprocessed['node_id'] == t_temp_node, \n",
    "                                                  ['actual influence']].values[0][0]\n",
    "        \n",
    "        t_current_node_infl = temp_infl_node\n",
    "    else:\n",
    "        t_current_node_infl = 0.0\n",
    "\n",
    "    t_node_infl.append(t_current_node_infl)\n",
    "    \n",
    "    \n",
    "\n",
    "# df_edge_preprocessed_1['src_node_influence'] = f_node_infl\n",
    "# df_edge_preprocessed_1['dst_node_influence'] = t_node_infl\n",
    "df_edge_preprocessed_1['src_node_influence'] = np.array(f_node_infl) - min(f_node_infl) + 1\n",
    "df_edge_preprocessed_1['dst_node_influence'] = np.array(t_node_infl) - min(t_node_infl) + 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 264,
   "id": "1aa63133",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([3, 3, 6, ..., 3, 3, 3])"
      ]
     },
     "execution_count": 264,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "labels[df_edge_preprocessed_2['from_edges'].values]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 265,
   "id": "3a3b662f",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_preprocessed_2 = df_edge_preprocessed_1.copy()\n",
    "label_list_f = []\n",
    "label_list_t = []\n",
    "# labels = labels.numpy()\n",
    "for i in range(len(df_edge_preprocessed_1)):\n",
    "    f_id = df_edge_preprocessed_1.loc[i, ['from_edges']].values[0]\n",
    "    f_id = int(f_id)\n",
    "    f_c = labels[f_id]\n",
    "    label_list_f.append(f_c)\n",
    "    \n",
    "    \n",
    "    t_id = df_edge_preprocessed_1.loc[i, ['to_edges']].values[0]\n",
    "    t_id = int(t_id)\n",
    "    t_c = labels[t_id]\n",
    "    label_list_t.append(t_c)\n",
    "df_edge_preprocessed_2['from_node_labels'] = label_list_f\n",
    "df_edge_preprocessed_2['to_node_labels'] = label_list_t"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 350,
   "id": "078341d9",
   "metadata": {},
   "outputs": [],
   "source": [
    "# test_mask = test_mask.numpy()\n",
    "val_mask = val_mask.numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 351,
   "id": "6383dd0b",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_edge_preprocessed_3 = df_edge_preprocessed_2.copy()\n",
    "# 0: train, 1:test, 2:\n",
    "train_or_test_list_f = []\n",
    "train_or_test_list_t = []\n",
    "\n",
    "for i in range(len(df_edge_preprocessed_2)):\n",
    "    f_id = df_edge_preprocessed_1.loc[i, ['from_edges']].values[0]\n",
    "    f_id = int(f_id)\n",
    "    t_id = df_edge_preprocessed_1.loc[i, ['to_edges']].values[0]\n",
    "    t_id = int(t_id)\n",
    "    \n",
    "    if train_mask[f_id]:\n",
    "        train_or_test_list_f.append(0)\n",
    "    elif test_mask[f_id]:\n",
    "        train_or_test_list_f.append(1)\n",
    "    else:\n",
    "        train_or_test_list_f.append(2)\n",
    "        \n",
    "    if train_mask[t_id]:\n",
    "        train_or_test_list_t.append(0)\n",
    "    elif test_mask[t_id]:\n",
    "        train_or_test_list_t.append(1)\n",
    "    else:\n",
    "        train_or_test_list_t.append(2)\n",
    "\n",
    "df_edge_preprocessed_3['from_node_train_test'] = train_or_test_list_f\n",
    "df_edge_preprocessed_3['to_node_train_test'] = train_or_test_list_t"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b60589aa",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 267,
   "id": "945bde90",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>from_edges</th>\n",
       "      <th>to_edges</th>\n",
       "      <th>influence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>1281.0</td>\n",
       "      <td>2.605583</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>132</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>2014.0</td>\n",
       "      <td>0.344481</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>437</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>1797.0</td>\n",
       "      <td>0.136648</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>784</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>2013.0</td>\n",
       "      <td>0.084075</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>818</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>1280.0</td>\n",
       "      <td>0.080981</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9198</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>1848.0</td>\n",
       "      <td>-0.021757</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13049</th>\n",
       "      <td>2014.0</td>\n",
       "      <td>2419.0</td>\n",
       "      <td>-0.183339</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       from_edges  to_edges  influence\n",
       "1          2014.0    1281.0   2.605583\n",
       "132        2014.0    2014.0   0.344481\n",
       "437        2014.0    1797.0   0.136648\n",
       "784        2014.0    2013.0   0.084075\n",
       "818        2014.0    1280.0   0.080981\n",
       "9198       2014.0    1848.0  -0.021757\n",
       "13049      2014.0    2419.0  -0.183339"
      ]
     },
     "execution_count": 267,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_edge_preprocessed.loc[df_edge_preprocessed['from_edges'] == 2014]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 268,
   "id": "9494df2a",
   "metadata": {},
   "outputs": [],
   "source": [
    "g = dgl.graph(([1, 1, 2, 3, 4], [0, 2, 0, 4, 2]))\n",
    "g0 = dgl.to_networkx(g)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 269,
   "id": "c078c935",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>actual influence</th>\n",
       "      <th>node_id</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>15.530282</td>\n",
       "      <td>2079</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>14.665039</td>\n",
       "      <td>1879</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>13.158551</td>\n",
       "      <td>2367</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>12.499614</td>\n",
       "      <td>1716</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>12.212362</td>\n",
       "      <td>1793</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>135</th>\n",
       "      <td>-1.322061</td>\n",
       "      <td>2209</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>136</th>\n",
       "      <td>-1.688545</td>\n",
       "      <td>2658</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>137</th>\n",
       "      <td>-1.981031</td>\n",
       "      <td>542</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>138</th>\n",
       "      <td>-3.037878</td>\n",
       "      <td>138</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>139</th>\n",
       "      <td>-4.082214</td>\n",
       "      <td>432</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>140 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     actual influence  node_id\n",
       "0           15.530282     2079\n",
       "1           14.665039     1879\n",
       "2           13.158551     2367\n",
       "3           12.499614     1716\n",
       "4           12.212362     1793\n",
       "..                ...      ...\n",
       "135         -1.322061     2209\n",
       "136         -1.688545     2658\n",
       "137         -1.981031      542\n",
       "138         -3.037878      138\n",
       "139         -4.082214      432\n",
       "\n",
       "[140 rows x 2 columns]"
      ]
     },
     "execution_count": 269,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_node_preprocessed"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 290,
   "id": "7b70f18f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>from_edges</th>\n",
       "      <th>to_edges</th>\n",
       "      <th>influence</th>\n",
       "      <th>src_node_influence</th>\n",
       "      <th>dst_node_influence</th>\n",
       "      <th>from_node_labels</th>\n",
       "      <th>to_node_labels</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>5101</th>\n",
       "      <td>2079</td>\n",
       "      <td>2079</td>\n",
       "      <td>-0.096402</td>\n",
       "      <td>20.612496</td>\n",
       "      <td>20.612496</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5417</th>\n",
       "      <td>1879</td>\n",
       "      <td>1059</td>\n",
       "      <td>-0.182723</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5327</th>\n",
       "      <td>1879</td>\n",
       "      <td>2326</td>\n",
       "      <td>-0.140576</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3231</th>\n",
       "      <td>1879</td>\n",
       "      <td>1060</td>\n",
       "      <td>-0.020915</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5486</th>\n",
       "      <td>1879</td>\n",
       "      <td>1879</td>\n",
       "      <td>-0.263894</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>542</td>\n",
       "      <td>542</td>\n",
       "      <td>0.567068</td>\n",
       "      <td>3.101183</td>\n",
       "      <td>3.101183</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1276</th>\n",
       "      <td>542</td>\n",
       "      <td>541</td>\n",
       "      <td>0.025063</td>\n",
       "      <td>3.101183</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>6</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>138</td>\n",
       "      <td>138</td>\n",
       "      <td>0.674173</td>\n",
       "      <td>2.044336</td>\n",
       "      <td>2.044336</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>86</th>\n",
       "      <td>432</td>\n",
       "      <td>749</td>\n",
       "      <td>0.342567</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>432</td>\n",
       "      <td>432</td>\n",
       "      <td>0.843192</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5566 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      from_edges  to_edges  influence  src_node_influence  dst_node_influence  \\\n",
       "5101        2079      2079  -0.096402           20.612496           20.612496   \n",
       "5417        1879      1059  -0.182723           19.747253            5.082214   \n",
       "5327        1879      2326  -0.140576           19.747253            5.082214   \n",
       "3231        1879      1060  -0.020915           19.747253            5.082214   \n",
       "5486        1879      1879  -0.263894           19.747253           19.747253   \n",
       "...          ...       ...        ...                 ...                 ...   \n",
       "35           542       542   0.567068            3.101183            3.101183   \n",
       "1276         542       541   0.025063            3.101183            5.082214   \n",
       "27           138       138   0.674173            2.044336            2.044336   \n",
       "86           432       749   0.342567            1.000000            5.082214   \n",
       "14           432       432   0.843192            1.000000            1.000000   \n",
       "\n",
       "      from_node_labels  to_node_labels  \n",
       "5101                 3               3  \n",
       "5417                 3               3  \n",
       "5327                 3               4  \n",
       "3231                 3               3  \n",
       "5486                 3               3  \n",
       "...                ...             ...  \n",
       "35                   6               6  \n",
       "1276                 6               0  \n",
       "27                   6               6  \n",
       "86                   1               1  \n",
       "14                   1               1  \n",
       "\n",
       "[5566 rows x 7 columns]"
      ]
     },
     "execution_count": 290,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_ede"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1109454f",
   "metadata": {},
   "outputs": [],
   "source": [
    "def neighbors_df(df, node_id):\n",
    "    pass"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 293,
   "id": "8318464d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>from_edges</th>\n",
       "      <th>to_edges</th>\n",
       "      <th>influence</th>\n",
       "      <th>src_node_influence</th>\n",
       "      <th>dst_node_influence</th>\n",
       "      <th>from_node_labels</th>\n",
       "      <th>to_node_labels</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3231</th>\n",
       "      <td>1879</td>\n",
       "      <td>1060</td>\n",
       "      <td>-0.020915</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5327</th>\n",
       "      <td>1879</td>\n",
       "      <td>2326</td>\n",
       "      <td>-0.140576</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5417</th>\n",
       "      <td>1879</td>\n",
       "      <td>1059</td>\n",
       "      <td>-0.182723</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5486</th>\n",
       "      <td>1879</td>\n",
       "      <td>1879</td>\n",
       "      <td>-0.263894</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>19.747253</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      from_edges  to_edges  influence  src_node_influence  dst_node_influence  \\\n",
       "3231        1879      1060  -0.020915           19.747253            5.082214   \n",
       "5327        1879      2326  -0.140576           19.747253            5.082214   \n",
       "5417        1879      1059  -0.182723           19.747253            5.082214   \n",
       "5486        1879      1879  -0.263894           19.747253           19.747253   \n",
       "\n",
       "      from_node_labels  to_node_labels  \n",
       "3231                 3               3  \n",
       "5327                 3               4  \n",
       "5417                 3               3  \n",
       "5486                 3               3  "
      ]
     },
     "execution_count": 293,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# df_edge_preprocessed_2.to_csv('temp_visulization.csv', index = False)\n",
    "df_edge_preprocessed_2.loc[df_edge_preprocessed_2['from_edges'] == 1879]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 272,
   "id": "919cfd10",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "1293"
      ]
     },
     "execution_count": 272,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.sum(df_edge_preprocessed_2['from_node_labels'] == 3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 314,
   "id": "125c71d6",
   "metadata": {},
   "outputs": [],
   "source": [
    "color_plate = ['pink', 'olive', 'Green','Cyan','Magenta','Yellow', 'Brown', 'Violet']\n",
    "color_plate_edge = ['Red','Blue','black']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 297,
   "id": "1879bc38",
   "metadata": {},
   "outputs": [],
   "source": [
    "def visulize_v1(df_node, df_edge, height='750px', width='100%', bgcolor='#ffffff', font_color=False):\n",
    "    \n",
    "    got_net = Network(height=height, width=width, bgcolor = bgcolor, font_color=font_color)\n",
    "    \n",
    "    \n",
    "    for i in range(len(df_edge)):\n",
    "        src = df_edge.loc[i, ['from_edges']].values[0]\n",
    "        src = int(src)\n",
    "        \n",
    "        dst = df_edge.loc[i, ['to_edges']].values[0]\n",
    "        dst = int(dst)\n",
    "        \n",
    "        \n",
    "        src_color = df_edge.loc[i, ['from_node_labels']].values[0]\n",
    "        src_color = int(src_color)\n",
    "#         print(src_color)\n",
    "        dst_color = df_edge.loc[i, ['to_node_labels']].values[0]\n",
    "        dst_color = int(dst_color)\n",
    "        \n",
    "        \n",
    "        src_infl = df_edge.loc[i, ['src_node_influence']].values[0]\n",
    "        src_infl = float(src_infl)\n",
    "        \n",
    "        dst_infl = df_edge.loc[i, ['dst_node_influence']].values[0]\n",
    "        dst_infl = float(dst_infl)\n",
    "        \n",
    "        \n",
    "        edge_infl = df_edge.loc[i, ['influence']].values[0].astype(float)\n",
    "        \n",
    "        got_net.add_node(n_id = src, title=str(src), size = src_infl, color = color_plate[src_color])\n",
    "        got_net.add_node(n_id = dst, title=str(dst), size = dst_infl, color = color_plate[dst_color])\n",
    "        \n",
    "        got_net.add_edge(src, dst, value=edge_infl)\n",
    "        \n",
    "    got_net.show('graph_influence.html')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 370,
   "id": "be06998e",
   "metadata": {},
   "outputs": [],
   "source": [
    "color_plate = ['pink', 'olive', 'Green','Cyan','Magenta','Yellow', 'Brown', 'Violet']\n",
    "color_plate_edge = ['Red','Blue','black']\n",
    "# type_plate = [\"octagon\", \"X\", \"^\"]\n",
    "type_plate = ['dot', 'star', 'diamond']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 378,
   "id": "71a01858",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 378,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "train_mask[2367]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 377,
   "id": "35473b44",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>from_edges</th>\n",
       "      <th>to_edges</th>\n",
       "      <th>influence</th>\n",
       "      <th>src_node_influence</th>\n",
       "      <th>dst_node_influence</th>\n",
       "      <th>from_node_labels</th>\n",
       "      <th>to_node_labels</th>\n",
       "      <th>from_node_train_test</th>\n",
       "      <th>to_node_train_test</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1281</td>\n",
       "      <td>2014</td>\n",
       "      <td>2.605583</td>\n",
       "      <td>14.652306</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1152</td>\n",
       "      <td>554</td>\n",
       "      <td>2.116021</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>14.878215</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1082</td>\n",
       "      <td>1082</td>\n",
       "      <td>1.797256</td>\n",
       "      <td>5.413330</td>\n",
       "      <td>5.413330</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>741</td>\n",
       "      <td>741</td>\n",
       "      <td>1.566844</td>\n",
       "      <td>5.069208</td>\n",
       "      <td>5.069208</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2297</td>\n",
       "      <td>1857</td>\n",
       "      <td>1.551643</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>5</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>995</th>\n",
       "      <td>2103</td>\n",
       "      <td>1529</td>\n",
       "      <td>0.038050</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>996</th>\n",
       "      <td>1439</td>\n",
       "      <td>771</td>\n",
       "      <td>0.038038</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>997</th>\n",
       "      <td>2271</td>\n",
       "      <td>2181</td>\n",
       "      <td>0.037987</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>998</th>\n",
       "      <td>2400</td>\n",
       "      <td>2400</td>\n",
       "      <td>0.037939</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>999</th>\n",
       "      <td>1257</td>\n",
       "      <td>1260</td>\n",
       "      <td>0.037769</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>5.082214</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1000 rows × 9 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     from_edges  to_edges  influence  src_node_influence  dst_node_influence  \\\n",
       "0          1281      2014   2.605583           14.652306            5.082214   \n",
       "1          1152       554   2.116021            5.082214           14.878215   \n",
       "2          1082      1082   1.797256            5.413330            5.413330   \n",
       "3           741       741   1.566844            5.069208            5.069208   \n",
       "4          2297      1857   1.551643            5.082214            5.082214   \n",
       "..          ...       ...        ...                 ...                 ...   \n",
       "995        2103      1529   0.038050            5.082214            5.082214   \n",
       "996        1439       771   0.038038            5.082214            5.082214   \n",
       "997        2271      2181   0.037987            5.082214            5.082214   \n",
       "998        2400      2400   0.037939            5.082214            5.082214   \n",
       "999        1257      1260   0.037769            5.082214            5.082214   \n",
       "\n",
       "     from_node_labels  to_node_labels  from_node_train_test  \\\n",
       "0                   3               0                     0   \n",
       "1                   3               3                     1   \n",
       "2                   6               6                     0   \n",
       "3                   1               1                     0   \n",
       "4                   3               5                     1   \n",
       "..                ...             ...                   ...   \n",
       "995                 2               2                     2   \n",
       "996                 2               2                     2   \n",
       "997                 0               3                     1   \n",
       "998                 3               3                     2   \n",
       "999                 6               6                     1   \n",
       "\n",
       "     to_node_train_test  \n",
       "0                     1  \n",
       "1                     0  \n",
       "2                     0  \n",
       "3                     0  \n",
       "4                     2  \n",
       "..                  ...  \n",
       "995                   2  \n",
       "996                   1  \n",
       "997                   1  \n",
       "998                   2  \n",
       "999                   2  \n",
       "\n",
       "[1000 rows x 9 columns]"
      ]
     },
     "execution_count": 377,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_edge_preprocessed_3[0:1000]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 372,
   "id": "53f822c4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def visulize_v2(df_node, df_edge, height='750px', width='100%', bgcolor='#ffffff', \n",
    "                font_color=False, bar_infl_edge = 0.09):\n",
    "    \n",
    "    got_net = Network(height=height, width=width, bgcolor = bgcolor, font_color=font_color)\n",
    "    \n",
    "    \n",
    "    for i in range(len(df_edge)):\n",
    "        src = df_edge.loc[i, ['from_edges']].values[0]\n",
    "        src = int(src)\n",
    "        \n",
    "        dst = df_edge.loc[i, ['to_edges']].values[0]\n",
    "        dst = int(dst)\n",
    "        \n",
    "        \n",
    "        src_color = df_edge.loc[i, ['from_node_labels']].values[0]\n",
    "        src_color = int(src_color)\n",
    "#         print(src_color)\n",
    "        dst_color = df_edge.loc[i, ['to_node_labels']].values[0]\n",
    "        dst_color = int(dst_color)\n",
    "        \n",
    "        \n",
    "        src_infl = df_edge.loc[i, ['src_node_influence']].values[0]\n",
    "        src_infl = float(src_infl)\n",
    "        \n",
    "        dst_infl = df_edge.loc[i, ['dst_node_influence']].values[0]\n",
    "        dst_infl = float(dst_infl)\n",
    "        \n",
    "        \n",
    "        edge_infl = df_edge.loc[i, ['influence']].values[0].astype(float)\n",
    "        \n",
    "        \n",
    "        src_train_test = df_edge.loc[i, ['from_node_train_test']].values[0]\n",
    "        src_train_test = int(src_train_test)\n",
    "        \n",
    "        dst_train_test = df_edge.loc[i, ['to_node_train_test']].values[0]\n",
    "        dst_train_test = int(src_train_test)\n",
    "        \n",
    "        \n",
    "        if edge_infl >= bar_infl_edge:\n",
    "            color_edge = color_plate_edge[0]\n",
    "            value_edge = abs(edge_infl)\n",
    "            \n",
    "        elif (edge_infl >= 0) and (edge_infl < bar_infl_edge):\n",
    "            color_edge = color_plate_edge[2]\n",
    "            value_edge = abs(edge_infl) + 0.1\n",
    "        else:\n",
    "            color_edge = color_plate_edge[1]\n",
    "            value_edge = abs(edge_infl)\n",
    "        \n",
    "        \n",
    "        if src_train_test == 0:\n",
    "            src_node_type = type_plate[0]\n",
    "        elif src_train_test == 1:\n",
    "            src_node_type = type_plate[1]\n",
    "        else:\n",
    "            src_node_type = type_plate[2]\n",
    "            \n",
    "        if dst_train_test == 0:\n",
    "            dst_node_type = type_plate[0]\n",
    "        elif dst_train_test == 1:\n",
    "            dst_node_type = type_plate[1]\n",
    "        else:\n",
    "            dst_node_type = type_plate[2]\n",
    "            \n",
    "#         print(src_node_type)\n",
    "#         got_net.add_node(n_id = src, title=str(src), size = src_infl, color = color_plate[src_color])\n",
    "#         got_net.add_node(n_id = dst, title=str(dst), size = dst_infl, color = color_plate[dst_color])\n",
    "        got_net.add_node(n_id = src, title=str(src), size = src_infl, \n",
    "                         color = color_plate[src_color], shape = src_node_type)\n",
    "        got_net.add_node(n_id = dst, title=str(dst), size = dst_infl, \n",
    "                         color = color_plate[dst_color], shape = dst_node_type)\n",
    "        \n",
    "        got_net.add_edge(src, dst, value=value_edge, color = color_edge)\n",
    "        \n",
    "    got_net.show('graph_influence_v2.html')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 373,
   "id": "6228c409",
   "metadata": {},
   "outputs": [],
   "source": [
    "# df_edge_preprocessed_2.loc[:, ['influence']].values[0].astype(float)\n",
    "edge_infl_array = df_edge_preprocessed_2.loc[:, ['influence']].values.astype(float).reshape(-1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 374,
   "id": "7333bf7c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.07411980334984485"
      ]
     },
     "execution_count": 374,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.quantile(edge_infl_array, 0.9)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 375,
   "id": "b62d349c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "star\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "dot\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "star\n",
      "dot\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "diamond\n",
      "dot\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "diamond\n",
      "star\n",
      "diamond\n",
      "star\n"
     ]
    }
   ],
   "source": [
    "visulize_v2(df_node_feature, df_edge_preprocessed_3[0:1000])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 302,
   "id": "8dae6e44",
   "metadata": {},
   "outputs": [],
   "source": [
    "visulize_v1(df_node_feature, df_edge_preprocessed_2[0:1000])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 303,
   "id": "a1176987",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "953"
      ]
     },
     "execution_count": 303,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_edge.loc[i, ['from_edges']].values[0].astype(int)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 304,
   "id": "e1d89672",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 304,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "isinstance(int(df_edge.loc[i, ['from_edges']].values[0]), int)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 385,
   "id": "4e163e0a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYIAAAD4CAYAAADhNOGaAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/MnkTPAAAACXBIWXMAAAsTAAALEwEAmpwYAAAdEklEQVR4nO3de3RU1d3/8fc3wYgNVlEicqtBS0UkMQkhRCCI3EHES0GxgKCLUrSotT/lQVlUa2uXF6pUiyBYAS0FqXgBi1VUolxESQADRIxIU5oHRLCPFMHIxf37I8M0hAlMMjO5sD+vtc7KnL33OWdvZi0+c86Zs8ecc4iIiL/iarsDIiJSuxQEIiKeUxCIiHhOQSAi4jkFgYiI5xrUdgeqo0mTJi45Obm2uyEiUq/k5+fvds4lVSyvl0GQnJxMXl5ebXdDRKReMbN/hirXpSEREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc9FJQjMrJ+ZfWJmW8xsQoh6M7MnAvUFZpZRoT7ezNaZ2WvR6I+IiIQv4iAws3hgKtAfaAfcYGbtKjTrD7QJLGOAaRXq7wA+jrQvIiJSddE4I8gCtjjntjrnDgDzgasqtLkKeM6VWQ2caWbNAMysJXAF8EwU+iIiIlUUjSBoAfyr3HpJoCzcNlOA8cB3xzuImY0xszwzy9u1a1dEHRYRkf+KRhBYiDIXThszGwh84ZzLP9FBnHMznHOZzrnMpKSk6vRTRERCiEYQlACtyq23BLaH2aYLMMjMiim7pNTDzP4chT6JiEiYohEEa4A2ZtbazBKAocCiCm0WATcGvj2UDexxzu1wzt3jnGvpnEsObPeOc254FPokIiJhahDpDpxzh8xsHPAGEA8865zbZGZjA/XTgSXAAGALsB+4KdLjiohIdJhzFS/n132ZmZkuLy+vtrshIlKvmFm+cy6zYrmeLBYR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyCQETEc1EJAjPrZ2afmNkWM5sQot7M7IlAfYGZZQTKW5nZMjP72Mw2mdkd0eiPiIiEL+IgMLN4YCrQH2gH3GBm7So06w+0CSxjgGmB8kPA/3POXQRkAz8Psa2IiMRQNM4IsoAtzrmtzrkDwHzgqgptrgKec2VWA2eaWTPn3A7n3FoA59xe4GOgRRT6JCIiYYpGELQA/lVuvYRj/zM/YRszSwbSgQ+i0CcREQlTNILAQpS5qrQxs0bAQuAXzrn/hDyI2RgzyzOzvF27dlW7syIicrRoBEEJ0Krcektge7htzOwUykJgrnPupcoO4pyb4ZzLdM5lJiUlRaHbIiIC0QmCNUAbM2ttZgnAUGBRhTaLgBsD3x7KBvY453aYmQF/Aj52zj0Whb6IiEgVNYh0B865Q2Y2DngDiAeedc5tMrOxgfrpwBJgALAF2A/cFNi8CzAC2GBm6wNl9zrnlkTaLxERCY85V/Fyft2XmZnp8vLyarsbIiL1ipnlO+cyK5bryWIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxnIJARMRzCgIREc8pCEREPKcgEBHxXFSCwMz6mdknZrbFzCaEqDczeyJQX2BmGeFuKyIisRVxEJhZPDAV6A+0A24ws3YVmvUH2gSWMcC0KmwrIiIxFI0zgixgi3Nuq3PuADAfuKpCm6uA51yZ1cCZZtYszG1FRCSGohEELYB/lVsvCZSF0yacbQEwszFmlmdmebt27Yq40yIiUiYaQWAhylyYbcLZtqzQuRnOuUznXGZSUlIVu1jBqvXwbt6xy6r1ke23EqNHj6awsPC4bUaNGsWLL74Yk+OLiBxPgyjsowRoVW69JbA9zDYJYWwbfQcPVa08Qs8880xM9isiEg3ROCNYA7Qxs9ZmlgAMBRZVaLMIuDHw7aFsYI9zbkeY29YbxcXFtG3blpEjR5KamsrgwYPZv38/3bt3Jy8vD4BGjRoxceJELrnkErKzs9m5c+cx+5k0aRKjRo3iu+++q+khiIiHIg4C59whYBzwBvAxsMA5t8nMxprZ2ECzJcBWYAswE7j1eNtG2qfa9MknnzBmzBgKCgr4/ve/z1NPPXVU/b59+8jOzuajjz6iW7duzJw586j68ePH88UXXzBr1izi4vSYh4jEXjQuDeGcW0LZf/bly6aXe+2An4e7bX3WqlUrunTpAsDw4cN54oknjqpPSEhg4MCBAHTo0IGlS5cG637zm9/QqVMnZsyYUXMdFhHv6SNnlJnZcddPOeWUYFl8fDyHDv33vkTHjh3Jz8/n3//+d+w7KiIS4GcQnFLJiVBl5VWwbds23n//fQDmzZtH165dw962X79+TJgwgSuuuIK9e/dG3BcRkXBE5dJQvdM5LWa7vuiii5gzZw4/+9nPaNOmDbfccguLFy8Oe/shQ4awd+9eBg0axJIlSzjttNNi1lcREQAru3xfv2RmZroj38KpS4qLixk4cCAbN26s7a6IiBzDzPKdc5kVy/28NCQiIkEKgihKTk7W2YCI1DsKAhERzykIREQ8pyAQEfGcgkBExHNePkcwefK57Nt37GRviYlNueuuz6N6rEaNGvH111+zfft2br/9dk01LSJ1jpdnBKFC4Hjl0dC8eXOFgIjUSV4GQaw89thjtG/fnvbt2zNlypSj6oqLi2nfvj0AnTp1YtOm/06y2r17d/Lz89m3bx8333wzHTt2JD09nVdffbUmuy8inlIQREl+fj6zZs3igw8+YPXq1cycOZN169aFbDt06FAWLFgAwI4dO9i+fTsdOnTgwQcfpEePHqxZs4Zly5Zx9913s2/fvpochoh4SEEQJStWrOCaa64hMTGRRo0ace2117J8+fKQba+77jr++te/ArBgwQKGDBkCwJtvvslDDz1EWloa3bt3p7S0lG3bttXYGETET17eLI6FqszZ1KJFC84++2wKCgp44YUXePrpp4P7WLhwIRdeeGGsuikicgwvzwgSE5tWqTwc3bp145VXXmH//v3s27ePl19+mZycnErbDx06lEceeYQ9e/aQkpICQN++fXnyySeDoVLZpSURkWjy8owg2l8RBcjIyGDUqFFkZWUBMHr0aNLT0yttP3jwYO644w4mTZoULJs0aRK/+MUvSE1NxTlHcnIyr732WtT7KiJSnqahFhHxhKahFhGRkBQEIiKeUxCIiHhOQSAi4jkFgYiI5xQEIiKe8/I5gnMnn8vOEDONNk1syucRPGOwc+dO7rzzTlavXk3jxo1JSEhg/PjxXHPNNZF0V0Qkprw8IwgVAscrD4dzjquvvppu3bqxdetW8vPzmT9/PiUlJUe1O3ToULWPISISC14GQSy88847JCQkMHbs2GDZeeedx2233cbs2bMZMmQIV155JX369Kl0uunDhw9z991307FjR1JTU4NzEOXm5tK9e3cGDx5M27ZtGTZsWJXmNhIROR4vLw3FwqZNm8jIyKi0/v3336egoICzzjqLe++9lx49evDss8/y1VdfkZWVRa9evZg7dy5nnHEGa9as4dtvv6VLly706dMHKJt3aNOmTTRv3pwuXbqwcuVKunbtWlPDE5GTmM4IYuTnP/85l1xyCR07dgSgd+/enHXWWUDl002/+eabPPfcc6SlpdGpUye+/PJLPv30UwCysrJo2bIlcXFxpKWlUVxcXFtDE5GTTERnBGZ2FvACkAwUA9c55/4vRLt+wB+AeOAZ59xDgfJHgSuBA8BnwE3Oua8i6VNtufjii1m4cGFwferUqezevZvMzLJpPRITE4N1lU037ZzjySefpG/fvkeV5+bmcuqppwbX4+Pjda9BRKIm0jOCCcDbzrk2wNuB9aOYWTwwFegPtANuMLN2geqlQHvnXCpQBNwTYX/C0rSS6aYrKw9Hjx49KC0tZdq0acGy/fv3h2xb2XTTffv2Zdq0aRw8eBCAoqIi/UKZiMRcpPcIrgK6B17PAXKB/6nQJgvY4pzbCmBm8wPbFTrn3izXbjUwOML+hCWSr4hWxsx45ZVXuPPOO3nkkUdISkoiMTGRhx9+mG+++eaotpVNNz169GiKi4vJyMjAOUdSUhKvvPJK1PsqIlJeRNNQm9lXzrkzy63/n3OucYU2g4F+zrnRgfURQCfn3LgK7RYDLzjn/nyi42oaahGRqqtsGuoTnhGY2VvAuSGqJoZ77BBlR6WPmU0EDgFzj9OPMcAYgB/84AdhHlpERE7khEHgnOtVWZ2Z7TSzZs65HWbWDPgiRLMSoFW59ZbA9nL7GAkMBHq645yeOOdmADOg7IzgRP0WEZHwRHqzeBEwMvB6JPBqiDZrgDZm1trMEoChge2OfJvof4BBzrnQd1ZFRCSmIg2Ch4DeZvYp0Duwjpk1N7MlAM65Q8A44A3gY2CBc25TYPs/AqcDS81svZlNj7A/IiJSRRF9a8g59yXQM0T5dmBAufUlwJIQ7X4YyfFFRCRyerJYRMRzXgbBuZR9laniEuqrUVXx+eefM3ToUC644ALatWvHgAEDKCoqinCvIiKx5WUQVDbZdPUnoS6bHuKaa66he/fufPbZZxQWFvK73/2OnTsj2auISOx5GQSxsGzZMk455ZSjpqFOS0tjxowZwWmmAYYNG8aiRYsoLi4mJyeHjIwMMjIyWLVqFaApp0Wk5ikIomTjxo106NDhmPLRo0cza9YsAPbs2cOqVasYMGAA55xzDkuXLmXt2rW88MIL3H777cFt1q1bx5QpUygsLGTr1q2sXLmyxsYhIv5REMTYZZddxpYtW/jiiy+YN28eP/7xj2nQoAEHDx7kpz/9KSkpKQwZMoTCwsLgNppyWkRqkn6YJkouvvhiXnzxxZB1I0aMYO7cucyfP59nn30WgMcff5ymTZvy0Ucf8d1339GwYcNge005LSI1ycszgsomm67+JNRl01B/++23zJw5M1i2Zs0a3n33XUaNGsWUKVOAssCAsstEzZo1Iy4ujueff57Dhw9HcHQRkerzMgg+p2zWu4pLJJNTmxkvv/wyS5cu5YILLuDiiy/m/vvvp3nz5jRt2pSLLrqIm266Kdj+1ltvZc6cOWRnZ1NUVHTUD9eIiNSkiKahri31bRrq/fv3k5KSwtq1aznjjDNquzsi4qnKpqH28oygJr311lu0bduW2267TSEgInWSbhbHWK9evdi2bVttd0NEpFI6IxAR8ZyCQETEcwoCERHPKQhERDznZxDEaB5qM2PEiBHB9UOHDpGUlMTAgQMj23EV5ObmBiewExEJh59BEIt5qIHExEQ2btzIN998A8DSpUtp0aJFZDutIgWBiFSVn0EQQ/379+dvf/sbAPPmzeOGG24I1n344Yd07tyZ9PR0OnfuzCeffAKUPXB23XXXkZqayvXXX0+nTp048sDcm2++yaWXXkpGRgZDhgzh66+/BiA5OZn77ruPjIwMUlJS2Lx5M8XFxUyfPp3HH3+ctLQ0li9fzuLFi+nUqRPp6en06tVLv48gIsdQEETZ0KFDmT9/PqWlpRQUFNCpU6dgXdu2bXnvvfdYt24dDzzwAPfeey8ATz31FI0bN6agoIBJkyaRn58PwO7du/ntb3/LW2+9xdq1a8nMzOSxxx4L7q9JkyasXbuWW265hcmTJ5OcnMzYsWO58847Wb9+PTk5OXTt2pXVq1ezbt06hg4dyiOPPFKz/yAiUufpgbIoS01Npbi4mHnz5jFgwICj6vbs2cPIkSP59NNPMTMOHjwIwIoVK7jjjjsAaN++PampqQCsXr2awsJCunTpAsCBAwe49NJLg/u79tprAejQoQMvvfRSyP6UlJRw/fXXs2PHDg4cOEDr1q2jO2ARqfd0RhADgwYN4q677jrqshDApEmTuPzyy9m4cSOLFy+mtLQUoNJfIHPO0bt3b9avX8/69espLCzkT3/6U7D+yHTVx5uq+rbbbmPcuHFs2LCBp59+OnhMEZEj/AyCWMxDXc7NN9/Mr371K1JSUo4q37NnT/Dm8ezZs4PlXbt2ZcGCBQAUFhayYcMGALKzs1m5ciVbtmwByu4lFBUVHffYp59+Onv37g15zDlz5kQ2MBE5KfkZBLGYh7qcli1bBi/1lDd+/HjuueceunTpctTvD9x6663s2rWL1NRUHn74YVJTUznjjDNISkpi9uzZ3HDDDaSmppKdnc3mzZuPe+wrr7ySl19+OXiz+P7772fIkCHk5OTQpEmT6AxQRE4qmoa6Djh8+DAHDx6kYcOGfPbZZ/Ts2ZOioiISEhJqu2sichKpbBpq3SyuA/bv38/ll1/OwYMHcc4xbdo0hYCI1BgFQR1w+umnczKd4YhI/eLnPQIREQlSEIiIeE5BICLiOQWBiIjnIgoCMzvLzJaa2aeBv40radfPzD4xsy1mNiFE/V1m5syshr7oHv15qJ1zdO3alddffz1YtmDBAvr163dM29zc3ODU1LNnz2bcuHHVPq6ISKQiPSOYALztnGsDvB1YP4qZxQNTgf5AO+AGM2tXrr4V0BuowV94j/481GbG9OnT+eUvf0lpaSn79u1j4sSJTJ06tdr7FBGpCZEGwVXAkXkL5gBXh2iTBWxxzm11zh0A5ge2O+JxYDxlz/bWa+3bt+fKK6/k4Ycf5te//jXDhw/nwQcfpGPHjqSnp/Pqq68ed/t//vOf9OzZk9TUVHr27Mm2bds4fPgw559/Ps45vvrqK+Li4njvvfcAyMnJCU4/ISJSXZEGQVPn3A6AwN9zQrRpAfyr3HpJoAwzGwT8r3PuoxMdyMzGmFmemeXt2rUrwm7Hzn333cdf/vIXXn/9dUpLS+nRowdr1qxh2bJl3H333ezbt6/SbceNG8eNN95IQUEBw4YN4/bbbyc+Pp4f/ehHFBYWsmLFCjp06MDy5cv59ttvKSkp4Yc//GENjk5ETkYnfKDMzN4i9MXziWEew0KUOTP7XmAffcLZiXNuBjADyqaYCPPYNS4xMZHrr7+eRo0asWDBAhYvXszkyZMBKC0tZdu2yq+Avf/++8HppEeMGMH48eOBsk/+7733Hv/4xz+45557mDlzJpdddhkdO3aM/YBE5KR3wiBwzvWqrM7MdppZM+fcDjNrBnwRolkJ0KrcektgO3AB0Br4yMyOlK81syznXJSmf6sdcXFxxMXF4Zxj4cKFXHjhhUfVh/srYYF/F3Jycpg+fTrbt2/ngQce4NFHHyU3N5du3bpFve8i4p9ILw0tAkYGXo8EQl0EXwO0MbPWZpYADAUWOec2OOfOcc4lO+eSKQuMjJoJgRjPQx3Qt29fnnzyyeDvDaxbt+647Tt37sz8+fMBmDt3Ll27dgWgU6dOrFq1iri4OBo2bEhaWhpPP/00OTk5Ue2viPgp0iB4COhtZp9S9s2fhwDMrLmZLQFwzh0CxgFvAB8DC5xzmyI8boRiPA91wKRJkzh48CCpqam0b9+eSZMmHbf9E088waxZs0hNTeX555/nD3/4A1D2AzStWrUiOzsbKDtD2Lt37zG/dyAiUh2ahlpExBOVTUOtJ4tFRDynIBAR8ZyCQETEcwoCERHPKQhERDynIBAR8ZyXv1n8UrdulH755THlDc8+m2sDE7pVR3x8PCkpKTjniI+P549//COdO3eOpKsiIjHnZRCECoHjlYfrtNNOY/369QC88cYb3HPPPbz77rtHtTl8+DDx8fERHUdEJJp0aShG/vOf/9C4cdnv9OTm5nL55Zfzk5/8hJSUFEpLS7nppptISUkhPT2dZcuWATBgwAAKCgoASE9P54EHHgDKnlB+5plnyM3NpXv37gwePJi2bdsybNgw6uMDgSJSt3h5RhAr33zzDWlpaZSWlrJjxw7eeeedYN2HH37Ixo0bad26Nb///e8B2LBhA5s3b6ZPnz4UFRXRrVs3li9fTnJyMg0aNGDlypUArFixguHDh7Njxw7WrVvHpk2baN68OV26dGHlypXBOYlERKpDZwRRdOTS0ObNm/n73//OjTfeGPzEnpWVRevWrYGy/9hHjBgBQNu2bTnvvPMoKioKTje9YsUKrrjiCr7++mv2799PcXFxcAbTrKwsWrZsSVxcHGlpaRQXF9fKWEXk5KEzghi59NJL2b17N0d+RCcxMTFYV9nlnI4dO5KXl8f5559P79692b17NzNnzqRDhw7BNqeeemrwdXx8PIcOHYrRCETEF16eETQ8++wqlVfH5s2bOXz4MGeH2Ge3bt2YO3cuAEVFRWzbto0LL7yQhIQEWrVqxYIFC8jOziYnJ4fJkydrumkRiSkvzwgi+Yro8Ry5RwBln/rnzJkT8htCt956K2PHjiUlJYUGDRowe/bs4Cf9nJwc3n77bb73ve+Rk5NDSUmJgkBEYkrTUIuIeELTUIuISEgKAhERzykIREQ8pyAQEfGcgkBExHMKAhERzykIREQ8pyAQEfGcgkBExHP18sliM9sF/LO2+1ENTYDdtd2JGuTbeEFj9kV9HfN5zrmkioX1MgjqKzPLC/V498nKt/GCxuyLk23MujQkIuI5BYGIiOcUBDVrRm13oIb5Nl7QmH1xUo1Z9whERDynMwIREc8pCEREPKcgiCIzO8vMlprZp4G/jStp18/MPjGzLWY2IUT9XWbmzKxJ7HsdmUjHbGaPmtlmMysws5fN7Mwa63wVhfG+mZk9EagvMLOMcLetq6o7ZjNrZWbLzOxjM9tkZnfUfO+rJ5L3OVAfb2brzOy1mut1hJxzWqK0AI8AEwKvJwAPh2gTD3wGnA8kAB8B7crVtwLeoOyBuSa1PaZYjxnoAzQIvH441PZ1YTnR+xZoMwB4HTAgG/gg3G3r4hLhmJsBGYHXpwNFJ/uYy9X/EvgL8FptjyfcRWcE0XUVMCfweg5wdYg2WcAW59xW59wBYH5guyMeB8YD9eUufkRjds696Zw7FGi3GmgZ2+5W24neNwLrz7kyq4EzzaxZmNvWRdUes3Nuh3NuLYBzbi/wMdCiJjtfTZG8z5hZS+AK4Jma7HSkFATR1dQ5twMg8PecEG1aAP8qt14SKMPMBgH/65z7KNYdjaKIxlzBzZR90qqLwhlDZW3CHX9dE8mYg8wsGUgHPoh+F6Mu0jFPoeyD3Hcx6l9MNKjtDtQ3ZvYWcG6Iqonh7iJEmTOz7wX20ae6fYuVWI25wjEmAoeAuVXrXY054RiO0yacbeuiSMZcVmnWCFgI/MI5958o9i1Wqj1mMxsIfOGcyzez7tHuWCwpCKrIOdersjoz23nktDhwqvhFiGYllN0HOKIlsB24AGgNfGRmR8rXmlmWc+7zqA2gGmI45iP7GAkMBHq6wEXWOui4YzhBm4Qwtq2LIhkzZnYKZSEw1zn3Ugz7GU2RjHkwMMjMBgANge+b2Z+dc8Nj2N/oqO2bFCfTAjzK0TdOHwnRpgGwlbL/9I/cjLo4RLti6sfN4ojGDPQDCoGk2h7LCcZ5wveNsmvD5W8ifliV97yuLRGO2YDngCm1PY6aGnOFNt2pRzeLa70DJ9MCnA28DXwa+HtWoLw5sKRcuwGUfYviM2BiJfuqL0EQ0ZiBLZRdb10fWKbX9piOM9ZjxgCMBcYGXhswNVC/AcisynteF5fqjhnoStkllYJy7+2A2h5PrN/ncvuoV0GgKSZERDynbw2JiHhOQSAi4jkFgYiI5xQEIiKeUxCIiHhOQSAi4jkFgYiI5/4/revdkmiNC24AAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "colors = ['pink', 'olive', 'Green','Cyan','Magenta','Yellow', 'Brown']\n",
    "f = lambda m,c: plt.plot([],[],marker=m, color=c, ls=\"none\")[0]\n",
    "handles = [f(\"s\", colors[i]) for i in range(7)]\n",
    "labels = colors\n",
    "legend = plt.legend(handles, labels, loc=3, framealpha=1, frameon=False)\n",
    "\n",
    "def export_legend(legend, filename=\"legend.png\"):\n",
    "    fig  = legend.figure\n",
    "    fig.canvas.draw()\n",
    "    bbox  = legend.get_window_extent().transformed(fig.dpi_scale_trans.inverted())\n",
    "    fig.savefig(filename, dpi=\"figure\", bbox_inches=bbox)\n",
    "\n",
    "export_legend(legend)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 382,
   "id": "824f22f1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7fd80550ad00>,\n",
       " <matplotlib.lines.Line2D at 0x7fd805d09a90>,\n",
       " <matplotlib.lines.Line2D at 0x7fd805d67280>]"
      ]
     },
     "execution_count": 382,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pylab\n",
    "fig = pylab.figure()\n",
    "figlegend = pylab.figure(figsize=(3,2))\n",
    "ax = fig.add_subplot(111)\n",
    "lines = ax.plot(range(10), pylab.randn(10), range(10), pylab.randn(10))\n",
    "figlegend.legend(lines, ('one', 'two'), 'center')\n",
    "fig.show()\n",
    "figlegend.show()\n",
    "figlegend.savefig('legend.png')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
