{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from matplotlib_venn import venn3\n",
    "import networkx as nx"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.append('../../code')\n",
    "\n",
    "import min_vertex_k_cut"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>smiles</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Brc1ccc(-c2nc3ccc(Nc4ccnc5ccccc45)cc3[nH]2)cc1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Brc1ccc(-c2nc3ccc(Nc4ncnc5ccccc45)cc3[nH]2)cc1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Brc1cccc(Nc2ncnc3ccc(NCc4ccc5c(c4)OCCCO5)cc23)c1</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>C#CC(C)OC1=CC(=O)C(Nc2ncnc3cc(OCCCN4CCCC4)c(OC...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>C#CC(OC1=CC(=O)C(Nc2ncnc3cc(OCCCN4CCCC4)c(OC)c...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6272</th>\n",
       "      <td>c1cn(Cc2ccc3c(c2)-c2[nH]nc(-c4ccsc4)c2C3)cn1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6273</th>\n",
       "      <td>c1cnc(CCc2ccncc2)c(-c2nnc(NCc3ccc4c(c3)OCO4)o2)c1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6274</th>\n",
       "      <td>c1cnc(CCc2ccncc2)c(-c2nnc(Nc3cnc4ccccc4c3)o2)c1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6275</th>\n",
       "      <td>c1cncc(-c2cnn3cc(-c4ccc(OCCN5CCCCC5)cc4)cnc23)c1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6276</th>\n",
       "      <td>c1csc(-c2n[nH]c3c2Cc2ccccc2-3)c1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>6277 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 smiles  value\n",
       "0        Brc1ccc(-c2nc3ccc(Nc4ccnc5ccccc45)cc3[nH]2)cc1   True\n",
       "1        Brc1ccc(-c2nc3ccc(Nc4ncnc5ccccc45)cc3[nH]2)cc1   True\n",
       "2      Brc1cccc(Nc2ncnc3ccc(NCc4ccc5c(c4)OCCCO5)cc23)c1  False\n",
       "3     C#CC(C)OC1=CC(=O)C(Nc2ncnc3cc(OCCCN4CCCC4)c(OC...   True\n",
       "4     C#CC(OC1=CC(=O)C(Nc2ncnc3cc(OCCCN4CCCC4)c(OC)c...   True\n",
       "...                                                 ...    ...\n",
       "6272       c1cn(Cc2ccc3c(c2)-c2[nH]nc(-c4ccsc4)c2C3)cn1   True\n",
       "6273  c1cnc(CCc2ccncc2)c(-c2nnc(NCc3ccc4c(c3)OCO4)o2)c1   True\n",
       "6274    c1cnc(CCc2ccncc2)c(-c2nnc(Nc3cnc4ccccc4c3)o2)c1   True\n",
       "6275   c1cncc(-c2cnn3cc(-c4ccc(OCCN5CCCCC5)cc4)cnc23)c1   True\n",
       "6276                   c1csc(-c2n[nH]c3c2Cc2ccccc2-3)c1   True\n",
       "\n",
       "[6277 rows x 2 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "kdr_hi = pd.read_csv('../../data/raw/kdr_hi.csv', index_col=0)\n",
    "kdr_hi"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "smiles = kdr_hi['smiles'].to_list()\n",
    "threshold = 0.4\n",
    "\n",
    "neighborhood_graph = min_vertex_k_cut.get_neighborhood_graph(smiles, threshold)\n",
    "main_component, small_components = min_vertex_k_cut.get_main_component(neighborhood_graph)\n",
    "\n",
    "old_nodes_to_new = dict(zip(main_component.nodes(), range(main_component.number_of_nodes())))\n",
    "new_nodes_to_old = {v: k for k, v in old_nodes_to_new.items()}\n",
    "main_component = nx.relabel_nodes(main_component, old_nodes_to_new)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.9 5270 123.22542694497153\n",
      "0.8 3313 65.42952007244189\n",
      "0.7 1590 28.057861635220124\n",
      "0.6 854 15.704918032786885\n",
      "0.5 506 11.1699604743083\n",
      "0.4 295 9.152542372881356\n"
     ]
    }
   ],
   "source": [
    "for coarse_threhold in [0.90, 0.80, 0.70, 0.60, 0.50, 0.40]:\n",
    "    coarsed_main_component, _ = min_vertex_k_cut.coarse_graph(main_component, coarse_threhold)\n",
    "    node_degrees = list(dict(coarsed_main_component.degree()).values())\n",
    "    print(coarse_threhold, len(coarsed_main_component), np.mean(node_degrees))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "coarsed_main_component, node_to_cluster = min_vertex_k_cut.coarse_graph(main_component, 0.4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total molecules: 5710\n",
      "Min size of a partition: 856\n",
      "Welcome to the CBC MILP Solver \n",
      "Version: Trunk\n",
      "Build Date: Oct 24 2021 \n",
      "\n",
      "Starting solution of the Linear programming relaxation problem using Primal Simplex\n",
      "\n",
      "Coin0506I Presolve 7513 (-885) rows, 885 (0) columns and 16200 (-1770) elements\n",
      "Clp1000I sum of infeasibilities 4.1514e-06 - average 5.52563e-10, 0 fixed columns\n",
      "Coin0506I Presolve 7513 (0) rows, 885 (0) columns and 16200 (0) elements\n",
      "Clp0029I End of values pass after 885 iterations\n",
      "Clp0000I Optimal - objective value 5710\n",
      "Clp0000I Optimal - objective value 5710\n",
      "Clp0000I Optimal - objective value 5710\n",
      "Coin0511I After Postsolve, objective 5710, infeasibilities - dual 0 (0), primal 0 (0)\n",
      "Clp0032I Optimal objective 5710 - 0 iterations time 0.302, Presolve 0.00, Idiot 0.30\n",
      "\n",
      "Starting MIP optimization\n",
      "Cgl0003I 0 fixed, 0 tightened bounds, 6032 strengthened rows, 0 substitutions\n",
      "Cgl0003I 0 fixed, 0 tightened bounds, 1132 strengthened rows, 0 substitutions\n",
      "Cgl0003I 0 fixed, 0 tightened bounds, 51 strengthened rows, 0 substitutions\n",
      "Cgl0004I processed model has 6116 rows, 885 columns (885 integer (885 of which binary)) and 19224 elements\n",
      "Coin3009W Conflict graph built in 0.010 seconds, density: 0.517%\n",
      "Cgl0015I Clique Strengthening extended 0 cliques, 0 were dominated\n",
      "Cbc0045I Nauty: 8532 orbits (9 useful covering 18 variables), 3 generators, group size: 8 - sparse size 60510 - took 0.023144 seconds\n",
      "Cbc0038I Initial state - 885 integers unsatisfied sum - 176.897\n",
      "Cbc0038I Pass   1: (0.59 seconds) suminf.   59.27677 (226) obj. -4722.4 iterations 1553\n",
      "Cbc0038I Pass   2: (0.62 seconds) suminf.   39.57341 (110) obj. -4233.73 iterations 196\n",
      "Cbc0038I Pass   3: (0.63 seconds) suminf.   32.58399 (166) obj. -4110.58 iterations 114\n",
      "Cbc0038I Pass   4: (0.64 seconds) suminf.   30.07545 (153) obj. -3853.71 iterations 91\n",
      "Cbc0038I Pass   5: (0.66 seconds) suminf.   15.34659 (46) obj. -3419.75 iterations 215\n",
      "Cbc0038I Pass   6: (0.66 seconds) suminf.   14.65842 (44) obj. -3408.05 iterations 22\n",
      "Cbc0038I Pass   7: (0.67 seconds) suminf.    8.81896 (29) obj. -3227.2 iterations 65\n",
      "Cbc0038I Pass   8: (0.67 seconds) suminf.    8.81896 (29) obj. -3227.2 iterations 5\n",
      "Cbc0038I Pass   9: (0.67 seconds) suminf.    2.91509 (6) obj. -3099.05 iterations 42\n",
      "Cbc0038I Pass  10: (0.68 seconds) suminf.    2.80754 (7) obj. -3073.02 iterations 4\n",
      "Cbc0038I Pass  11: (0.68 seconds) suminf.    1.40566 (3) obj. -3192.66 iterations 7\n",
      "Cbc0038I Pass  12: (0.68 seconds) suminf.    1.40566 (3) obj. -3192.66 iterations 0\n",
      "Cbc0038I Pass  13: (0.68 seconds) suminf.    0.97170 (2) obj. -3097 iterations 3\n",
      "Cbc0038I Pass  14: (0.68 seconds) suminf.    0.93711 (2) obj. -3097 iterations 2\n",
      "Cbc0038I Pass  15: (0.69 seconds) suminf.   16.51243 (52) obj. -2728.2 iterations 236\n",
      "Cbc0038I Pass  16: (0.70 seconds) suminf.    4.47624 (12) obj. -2698.43 iterations 176\n",
      "Cbc0038I Pass  17: (0.71 seconds) suminf.    4.21425 (12) obj. -2698.43 iterations 3\n",
      "Cbc0038I Pass  18: (0.71 seconds) suminf.    0.33659 (2) obj. -2981 iterations 15\n",
      "Cbc0038I Solution found of -2981\n",
      "Cbc0038I Before mini branch and bound, 0 integers at bound fixed and 0 continuous\n",
      "Cbc0038I Full problem 6116 rows 885 columns, reduced to 6116 rows 885 columns - 48 fixed gives 1742, 486 - ok now\n",
      "Cbc0038I Full problem 6116 rows 885 columns, reduced to 1742 rows 486 columns\n",
      "Cbc0038I Mini branch and bound improved solution from -2981 to -3630 (2.18 seconds)\n",
      "Cbc0038I Round again with cutoff of -3838.9\n",
      "Cbc0038I Pass  19: (2.19 seconds) suminf.   59.27677 (226) obj. -4722.4 iterations 0\n",
      "Cbc0038I Pass  20: (2.21 seconds) suminf.   39.57341 (110) obj. -4233.73 iterations 250\n",
      "Cbc0038I Pass  21: (2.23 seconds) suminf.   32.77974 (165) obj. -3899.64 iterations 128\n",
      "Cbc0038I Pass  22: (2.23 seconds) suminf.   30.16831 (164) obj. -3867.33 iterations 20\n",
      "Cbc0038I Pass  23: (2.26 seconds) suminf.   17.22610 (60) obj. -3838.9 iterations 304\n",
      "Cbc0038I Pass  24: (2.27 seconds) suminf.   16.61995 (57) obj. -3838.9 iterations 117\n",
      "Cbc0038I Pass  25: (2.28 seconds) suminf.   16.26967 (55) obj. -3838.9 iterations 101\n",
      "Cbc0038I Pass  26: (2.29 seconds) suminf.   16.21096 (54) obj. -3838.9 iterations 64\n",
      "Cbc0038I Pass  27: (2.30 seconds) suminf.   14.08302 (45) obj. -3838.9 iterations 143\n",
      "Cbc0038I Pass  28: (2.31 seconds) suminf.   13.92785 (46) obj. -3838.9 iterations 83\n",
      "Cbc0038I Pass  29: (2.32 seconds) suminf.   11.83120 (38) obj. -3838.9 iterations 92\n",
      "Cbc0038I Pass  30: (2.32 seconds) suminf.   11.83118 (38) obj. -3838.9 iterations 8\n",
      "Cbc0038I Pass  31: (2.33 seconds) suminf.    9.85603 (28) obj. -3838.9 iterations 101\n",
      "Cbc0038I Pass  32: (2.33 seconds) suminf.    9.85226 (27) obj. -3838.9 iterations 27\n",
      "Cbc0038I Pass  33: (2.33 seconds) suminf.    9.85226 (27) obj. -3838.9 iterations 0\n",
      "Cbc0038I Pass  34: (2.34 seconds) suminf.   10.66830 (27) obj. -3838.9 iterations 126\n",
      "Cbc0038I Pass  35: (2.34 seconds) suminf.   10.29270 (28) obj. -3838.9 iterations 66\n",
      "Cbc0038I Pass  36: (2.35 seconds) suminf.    9.50845 (30) obj. -3838.9 iterations 34\n",
      "Cbc0038I Pass  37: (2.35 seconds) suminf.    9.50845 (30) obj. -3838.9 iterations 4\n",
      "Cbc0038I Pass  38: (2.36 seconds) suminf.   10.14960 (27) obj. -3838.9 iterations 125\n",
      "Cbc0038I Pass  39: (2.36 seconds) suminf.   10.14960 (27) obj. -3838.9 iterations 42\n",
      "Cbc0038I Pass  40: (2.37 seconds) suminf.   10.14960 (27) obj. -3838.9 iterations 2\n",
      "Cbc0038I Pass  41: (2.37 seconds) suminf.   10.14960 (27) obj. -3838.9 iterations 10\n",
      "Cbc0038I Pass  42: (2.37 seconds) suminf.   10.32496 (27) obj. -3838.9 iterations 67\n",
      "Cbc0038I Pass  43: (2.38 seconds) suminf.   10.32230 (27) obj. -3838.9 iterations 23\n",
      "Cbc0038I Pass  44: (2.38 seconds) suminf.    9.86035 (27) obj. -3838.9 iterations 50\n",
      "Cbc0038I Pass  45: (2.38 seconds) suminf.    9.86035 (27) obj. -3838.9 iterations 7\n",
      "Cbc0038I Pass  46: (2.39 seconds) suminf.   10.58182 (28) obj. -3838.9 iterations 92\n",
      "Cbc0038I Pass  47: (2.40 seconds) suminf.   10.12690 (29) obj. -3838.9 iterations 39\n",
      "Cbc0038I Pass  48: (2.40 seconds) suminf.   10.12690 (29) obj. -3838.9 iterations 5\n",
      "Cbc0038I No solution found this major pass\n",
      "Cbc0038I Before mini branch and bound, 0 integers at bound fixed and 0 continuous\n",
      "Cbc0038I Full problem 6116 rows 885 columns, reduced to 6116 rows 885 columns - 117 fixed gives 1084, 325 - ok now\n",
      "Cbc0038I Full problem 6116 rows 885 columns, reduced to 1084 rows 325 columns\n",
      "Cbc0038I Mini branch and bound improved solution from -3630 to -3696 (3.10 seconds)\n",
      "Cbc0038I Round again with cutoff of -4213.12\n",
      "Cbc0038I Pass  48: (3.11 seconds) suminf.   59.27677 (226) obj. -4722.4 iterations 0\n",
      "Cbc0038I Pass  49: (3.13 seconds) suminf.   39.57341 (110) obj. -4233.73 iterations 250\n",
      "Cbc0038I Pass  50: (3.15 seconds) suminf.   33.88853 (170) obj. -4213.12 iterations 151\n",
      "Cbc0038I Pass  51: (3.16 seconds) suminf.   31.43463 (182) obj. -4213.12 iterations 41\n",
      "Cbc0038I Pass  52: (3.16 seconds) suminf.   31.43463 (182) obj. -4213.12 iterations 0\n",
      "Cbc0038I Pass  53: (3.17 seconds) suminf.   27.47502 (179) obj. -4213.12 iterations 96\n",
      "Cbc0038I Pass  54: (3.19 seconds) suminf.   24.43690 (76) obj. -4213.12 iterations 127\n",
      "Cbc0038I Pass  55: (3.23 seconds) suminf.   26.23399 (166) obj. -4213.12 iterations 260\n",
      "Cbc0038I Pass  56: (3.23 seconds) suminf.   24.94531 (165) obj. -4213.12 iterations 46\n",
      "Cbc0038I Pass  57: (3.24 seconds) suminf.   24.94531 (165) obj. -4213.12 iterations 12\n",
      "Cbc0038I Pass  58: (3.28 seconds) suminf.   25.13837 (170) obj. -4213.12 iterations 283\n",
      "Cbc0038I Pass  59: (3.28 seconds) suminf.   24.65596 (169) obj. -4213.12 iterations 29\n",
      "Cbc0038I Pass  60: (3.31 seconds) suminf.   25.09872 (161) obj. -4213.12 iterations 227\n",
      "Cbc0038I Pass  61: (3.39 seconds) suminf.   47.63422 (212) obj. -4213.12 iterations 620\n",
      "Cbc0038I Pass  62: (3.42 seconds) suminf.   30.72558 (135) obj. -4213.12 iterations 344\n",
      "Cbc0038I Pass  63: (3.43 seconds) suminf.   30.72162 (136) obj. -4213.12 iterations 19\n",
      "Cbc0038I Pass  64: (3.43 seconds) suminf.   30.72162 (136) obj. -4213.12 iterations 1\n",
      "Cbc0038I Pass  65: (3.49 seconds) suminf.   47.98393 (194) obj. -4213.12 iterations 536\n",
      "Cbc0038I Pass  66: (3.52 seconds) suminf.   29.55003 (126) obj. -4213.12 iterations 289\n",
      "Cbc0038I Pass  67: (3.52 seconds) suminf.   28.72229 (131) obj. -4213.12 iterations 40\n",
      "Cbc0038I Pass  68: (3.53 seconds) suminf.   28.48900 (132) obj. -4213.12 iterations 42\n",
      "Cbc0038I Pass  69: (3.54 seconds) suminf.   28.21053 (132) obj. -4213.12 iterations 12\n",
      "Cbc0038I Pass  70: (3.55 seconds) suminf.   26.09815 (119) obj. -4213.12 iterations 86\n",
      "Cbc0038I Pass  71: (3.56 seconds) suminf.   25.81548 (118) obj. -4213.12 iterations 50\n",
      "Cbc0038I Pass  72: (3.56 seconds) suminf.   25.91101 (114) obj. -4213.12 iterations 56\n",
      "Cbc0038I Pass  73: (3.57 seconds) suminf.   25.64265 (122) obj. -4213.12 iterations 71\n",
      "Cbc0038I Pass  74: (3.58 seconds) suminf.   25.41765 (124) obj. -4213.12 iterations 43\n",
      "Cbc0038I Pass  75: (3.58 seconds) suminf.   25.41765 (124) obj. -4213.12 iterations 10\n",
      "Cbc0038I Pass  76: (3.59 seconds) suminf.   25.32540 (120) obj. -4213.12 iterations 37\n",
      "Cbc0038I Pass  77: (3.59 seconds) suminf.   25.32540 (120) obj. -4213.12 iterations 18\n",
      "Cbc0038I No solution found this major pass\n",
      "Cbc0038I Before mini branch and bound, 0 integers at bound fixed and 0 continuous\n",
      "Cbc0038I Full problem 6116 rows 885 columns, reduced to 6116 rows 885 columns - 117 fixed gives 1084, 325 - ok now\n",
      "Cbc0038I Mini branch and bound did not improve solution (3.92 seconds)\n",
      "Cbc0038I After 3.92 seconds - Feasibility pump exiting with objective of -3696 - took 3.54 seconds\n",
      "Cbc0012I Integer solution of -3696 found by feasibility pump after 0 iterations and 0 nodes (3.92 seconds)\n",
      "Cbc0030I Thread 0 used 0 times,  waiting to start 0.03910017, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 1 used 0 times,  waiting to start 0.037729263, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 2 used 0 times,  waiting to start 0.035860777, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 3 used 0 times,  waiting to start 0.034235954, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 4 used 0 times,  waiting to start 0.032502174, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 5 used 0 times,  waiting to start 0.030632496, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 6 used 0 times,  waiting to start 0.028613806, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 7 used 0 times,  waiting to start 0.026712656, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 8 used 0 times,  waiting to start 0.024844408, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 9 used 0 times,  waiting to start 0.022599936, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 10 used 0 times,  waiting to start 0.020697594, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 11 used 0 times,  waiting to start 0.018942833, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 12 used 0 times,  waiting to start 0.016968012, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 13 used 0 times,  waiting to start 0.015091896, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 14 used 0 times,  waiting to start 0.013318777, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 15 used 0 times,  waiting to start 0.01146841, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 16 used 0 times,  waiting to start 0.009449482, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 17 used 0 times,  waiting to start 0.0075492859, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 18 used 0 times,  waiting to start 0.0057370663, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Thread 19 used 0 times,  waiting to start 0.0037910938, 0 cpu time, 0 locks, 0 locked, 0 waiting for locks\n",
      "Cbc0030I Main thread 0 waiting for threads,  1 locks, 1.4305115e-06 locked, 4.7683716e-07 waiting for locks\n",
      "Cbc0011I Exiting as integer gap of 2014 less than 1e-10 or 50%\n",
      "Cbc0001I Search completed - best objective -3696, took 0 iterations and 0 nodes (3.96 seconds)\n",
      "Cbc0035I Maximum depth 0, 0 variables fixed on reduced cost\n",
      "Total time (CPU seconds):       4.17   (Wallclock seconds):       4.19\n",
      "\n"
     ]
    }
   ],
   "source": [
    "model = min_vertex_k_cut.trisect_connected_graph(coarsed_main_component, part_min_frac=0.15, emphasis=1, max_mip_gap=0.5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<OptimizationStatus.OPTIMAL: 0>"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.status"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[2014 1978  860  858]\n"
     ]
    }
   ],
   "source": [
    "split = min_vertex_k_cut.process_trisect_results(model, coarsed_main_component, main_component, node_to_cluster)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "first_idx = []\n",
    "second_idx = []\n",
    "third_idx = []\n",
    "\n",
    "for S_idx, partition in enumerate(split):\n",
    "    G_idx = new_nodes_to_old[S_idx]\n",
    "    if partition == 0:\n",
    "        first_idx.append(G_idx)\n",
    "    if partition == 1:\n",
    "        second_idx.append(G_idx)\n",
    "    if partition == 2:\n",
    "        third_idx.append(G_idx)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "for component in small_components:\n",
    "    i = np.argmin([len(first_idx), len(second_idx), len(third_idx)])\n",
    "    if i == 0:\n",
    "        first_idx.extend(component)\n",
    "    if i == 1:\n",
    "        second_idx.extend(component)\n",
    "    if i == 2:\n",
    "        third_idx.extend(component)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[1978, 1138, 1147]"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[len(first_idx), len(second_idx), len(third_idx)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [],
   "source": [
    "part_first = kdr_hi.iloc[first_idx]\n",
    "part_second = kdr_hi.iloc[second_idx]\n",
    "part_third = kdr_hi.iloc[third_idx]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib_venn._common.VennDiagram at 0x7fe9633539a0>"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAgMAAADxCAYAAABWHrRsAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAsMklEQVR4nO3deXST550v8K9kWZb3fcUbxmzGYUmIWZvEbQIhkKW0KdDpTdOTdDKdtMmkuaHcaee0k545c5vcm2mztDO5oUN6S5JbWnIaYCCQEBKWEHYSVtuAbcCrbORNtmVL7/3jiQGDF9mW9Dzv+34/5+g4tmzph/P41VfPatE0TQMRERGZllV2AURERCQXwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZmcTXYB5CefD3C7gY4O8bHvdv3nHo/4vr6bpgEWC2C1Xrs5HEBUVP9bdHT/zy0W2f9aIiIKIYumaZrsIugGXi/Q1AQ4nUBjo/h45Yp4gQ+2sDAgORlISQFSU8UtIUEECSIiMiSGARW0tgKXLoX+hd9f1weEtDQgO1v0IBARkSEwDMigaUBDA1BVBVRWAi6X7IpGLi0NyMsTt6Qk2dUQEdEYMAyESm+vePdfWQlUVwNdXbIrCpzY2GvBIDOTQwpERDrDMBBs9fXAqVPA+fNiLoDR2e3AxInAtGlirgERESmPYSAYenuBigoRApxO2dXIk5UFFBUB+fnsLSAiUhjDQCC5XCIAlJWJZX4kREUBU6eKGyceEhEph2EgEOrrgUOHgMuXZVeiNqsVGD8euO02DiEQESmEYWAsrlwBDhwQqwLIfxYLMHmyCAXR0bKrISIyPYaB0WhvFz0B5eVimSCNTlgYUFwMzJwJRETIroaIyLQYBkaiqws4elTMCzDDyoBQsdtFICguBmzcIZuIKNQYBvyhacAXXwCHDwM9PbKrMa6oKGDePGDCBNmVEBGZCsPAcFpagF27xCRBCo3x44GFC4HISNmVEBGZAsPAYPp6Aw4dEvsGUGg5HMCCBewlICIKAYaBgbA3QB3sJSAiCjqGgeuxN0BN7CUgIgoqhoE+3d3Ahx+Kw4RITVOmiF4Cbm1MRBRQDAOA2EZ42zagtVV2JTScjAzgnns4bEBEFEAMA9XVwM6dPEtAT2JigEWLgJQU2ZUQERmCucPAsWPAwYPcRVCPbDbgrruAggLZlRCRn3p7AbdbvPfy+cQNEDuUW61iU1KHQ3T8WSxyazUbc4YBrxf4+GNxzDDp26xZwO23y67CFHyaD82dzWjpaoG7x93v1tHTga7eLnh9XmjQ4NN8sMACi8UCq8UKe5gd0eHRiAqP6neLsccgJSoFETZuR20Ura1AYyPQ1CR2bne7r9387YC1WEQgiIoSt+hoID5edAampIhNSymwzBcGurqArVtFayVjyM8HvvY18baCAqLvhd/pdqKxoxFOtxPNnc3wasHZhjvWHouUqBSkRqeKj1GpDAg60NUF1NSIy2ljI+B0hmbENS4OSE0VwSA9XdzYkzA25goDbjewZYs4bZCMJTtbzCPg2Qaj1tXbheqWalS5qnCp9RJ6fHK33k6JSkF+Qj7y4vOQHJUstRa6xuUCKivFYa0NDWqMskZEADk54n1BdjZ7DkbDPGGgowPYvFlsKETGlJkJ3HsvEB4uuxLdaOlqQaWrElUtVahvr4cGNS8HMfYY5MXnIS8hD+Nix8HCt4Eh5XSKQ1qrqtRfdGW1AllZIhgUFjIY+MscYaC9Hdi0CWhrk10JBVt6OnDffQwEQ/BpPlS6KnGq8RRq2mpklzNi0eHRmJo6FVNSpiAqPEp2OYbl9QLnzolDWhsaZFczOjabCATTpgHJ7FwakvHDgNsNvPee+nGWAicjQwQCDhn00+HpwGnnaZxxnoG7xy27nDGzWqzIT8hHUWoRsmKzZJdjGK2twOnTwNmzYk6AUaSliVBQUMDpRQMxdhjo7BQ9Ai6X7Eoo1LKygCVL+FcPMRRwqOYQLrguwKf5ZJcTFImORNyaeSsmJHHL6tFqbRU7sZ87p8Y8gGCJjARuvRWYOpWbmV7PuGHA4xE9As3NsishWXJzxaRCk/7Fu3vcOFRzCGVNZYYNATdKiUpBybgSZMdlyy5FNzo7gSNHRG+AzxzNBIBYkTB7thhGIKOGAU0T2wtfvCi7EpKtuBiYP192FSHV3duNY3XHcLLxJHp95jxwKys2CyXjSpAWnSa7FGV5PMDnn4ubmc9lS04GSkrEagQzM2YY2L9ftHAiALjjDnHIkQmcajyFA5cPwOPl9toAMCFxAubnzEdkOM+yuN7588DevaJXgITcXOArXxEbHJmR8cJAWRmwa5fsKkglViuwbJmYWGhQbd1t+LjqY12uDgg2h82BBTkLOJ8AYkLgnj0iDNDN7HZg3jxg8mTZlYSescJAQ4OYMOgNzi5ppGORkcDXvy4OOTKYkw0n8dnlz0w7JOCv8QnjsTB3oWl7Cc6fF0HASCsEgiUnR3QomqmXwDhhoKMDePddsZSQaCApKcADDxhmySF7A0bOjL0E3d3A7t3sDRgpu11MN5o0SXYloWGMMOD1ipUDPG+AhlNQANx9t+wqxuxS6yV8cP4Dzg0YpaLUIszPmQ+rxdgrTa5cAd5/n9usjEVRkQgFRl+UZIwwsHu3WBdD5I9584BbbpFdxah9Xv85Prv0mbJbB+tFVmwW7i64Gw6bQ3YpQVFVBezcCfTIPWLCELKyxHsIhzGbCgAjhIFLl4D/+i/ZVZCe2GzAN74hzkTVEa/Pi93Vu1HWVCa7FMOItcdiceFiJEUmyS4loI4eFRsI6fzqrpTYWGDxYiDJWE3lKn2HgZ4eYMMGcfYA0UhkZAD336+bc0/dPW5sP7cdDR063SReYeHWcJSOL0V+Qr7sUsbM6xWLqc6dk12JMYWHA1/9KpCXJ7uSwNP3KMj+/QwCNDp1dcCJE7Kr8Etrdyv+euavDAJB0uPrwfZz23G6Ud9Djb29wNatDALB1NMDbN8uVrAbjX7DwKVLnCdAY3PwoPIzq1q6WrDp7Ca0eXjiZrDtrt6NEw36CIg38njEaGkNF5YEnaaJ3pczZ2RXElj6DAM9PcAnn8iugvSut1f8VSs6UubqcmFT2SZ09HTILsU09l3ch8/r9bV7aU+PCAJ1dbIrMZdPPjHW+1F9hgEOD1CgKDpc0Nrdii1lWwxx1LDe7L+0HycbTsouwy+9veIYlgaOIEmxe7dxhgz0Fwbq6owVx0i+gwfFplWK6PB0YHPZZvYISLT34l6cdZ6VXcaQfD4xfl1bK7sSc/v4Y2Ns6KS/MPDZZ7IrIKPp7QUOH5ZdBQCg19eL98+9j3YPe75k2129G7Vt6r7S7tsnpk6RXH1zCJxO2ZWMjb7CQFUVUF8vuwoyorNnAZdLdhX4uPJjON06v6oYhE/zYcf5HWjrVm/y5unTwKlTsqugPr29opdGz6dA6icMaJroziUKBgXa19Haozh3hevCVNLV24X3z72v1CFQtbXi+GFSS3s7sGOHGL7RI/2EgfJyoLlZdhVkZBcuSJuJVeWqwsEahl0VNXc246MLH8kuA4D+X3CMrq5OnAypR/oIA16v2FuTKNgOHAj5U7q6XNh5YWfIn5f8d8F1AYdr5M4r8XrFoUM8glhtZ87ocwhHH2Hg1CkuJaTQqKkBLl4M2dP5NB8+uvARenw8TUZ1R2qPSN0F8vBhoKlJ2tPTCOzfr/x+ZjdRPwz09IhTN4hCJYS9A8frjqPRzaO39UCDhl2Vu+D1eUP+3A0NwPHjIX9aGqW+/cz0RP0wUFbGfjEKraYm4PLloD/Nlc4rOFyrxpJG8o+ryxXy/2d9hw8pulEmDULR/cwGpX4Y0OPgC+lfkNudT/NhV+Uu+DTOBNOb43XHQzpccPiwEqteaRQOHNDPcIHaYaCmBrhyRXYVZEZVVUHdlZDDA/oVyuECDg/om+LHn/SjdhhgrwDJ4vMFbdvrdk87jtQeCcpjU2i4ulz4ouGLoD/Pvn36eCGhwdXVARUVsqsYnrphwO0GKitlV0FmduZMUBZ0H645DK8W+kloFFjH6o6hu7c7aI8vcdsLCrBDh9TfG0LdMBCkCzGR34IQSK90XkFZk0GOOTM5j9eDY3XHgvLYCmyISQHU1qZ+R7eaYSCIXbREIxLgv+CDNQehgf2+RnGi4QQ6PIGfW6LIURkUQEePipXyqlIzDFRXK3WkLJlYTU3ArsoNHQ2odFUG5LFIDV7NG/Clhl6vModoUgB1dgJfBH+ayaipGQYuXJBdAdE1ARoqOHA59FsdU/CddZ6Fq8sVsMc7dYrvhYzq+HGgO3jTTMZEvTCgaSHdDpZoWAEIA063EzVtNWOvhZSjQcOJhsDsLqNp+tqohkamp0cMAalIvTBQV8cdB0ktjY1jPqj8VKPis4doTMqbytHjHfuA8MWLYrIZGZeqEwnVCwNVVbIrIOpP08Q8llHyeD2oaNbBQmMatR5fD8qby8f8OCdPBqAYUlprq5qd3wwDRP4YQ7s86zyLXl9vAIshFY2196e1Fbh0KUDFkNJU7B1QKwy4XEBLi+wqiG526ZKY5j0KHCIwh+bOZtS1143650+f5m6DZlFdDbS3y66iP7XCAHsFSFW9vaM6ybCmrQYt3Qy4ZjHa4OfzqTuxjAJP09TbSketMDCGcVmioBtFWD1/5XwQCiFVVbmqRnWAUW0t502bjWor6NUJAz4fN+ImtdXXj/hHqlzs7TKTHl8PattrR/xz7BQ1H5dLreON1QkDLteox2SJQuLKFTFc4Cen24mOHu4eYzaj2WWSYcCcVDqLT50w0Miz3UlxmgY0N/v97ewVMKfqlpENdzY3c28Bs1IpBKoTBpxO2RUQDW8EobWqRaG/dAqZdk87nG7/r2cqvTuk0KqvV2d7YnXCAHsGSA/8DK0dno4RvSCQsYykd4Dzps3L51NnAyI1woDPN6LuVyJp/AytY1lvTvrn7/9/r5edomZXp8ilQo0w4HKNaGIWkTR+TiJkr4C5NXb4FxqbmsR7ITIvVcKgGmGAQwSkF35OImx0s02bWbe3G23dw88KVOWFgORRJRCqEQa4BTHpics17LewZ4D8CYR8H0Rer+hwlE2NMNDBtdikI273kHe3drfC4/WEqBhSlT+BkD0DBKjRDtQIA8NcXImUMkx49Xe8mIxtuDCgyjtCkk+FHiKGAaKRGqa9urpcoamDlHalc+hX+tZWNcaKST4/Rh6DTo0wwGEC0pNhwgC3ICYA6OzthDbEmcS87FEfFd4Pyw8DXi/g4fgq6cgwf7nuHgX+skk6n+ZDV+/gRxGq8AJAalChLcgPA4zHpDcMA+SnodqCCi8ApAaPR/5WOza5Tw/+RQzhk7IyvLh9Ow5XV6O2pQXv/uAHeGjmzKv317e24icbN2L7qVNwud24Y+JEvLJyJSampwMAKp1OjP/pTwd87D/97d/i4dtuAwAcrKzEmo0bcbi6GhaLBSX5+Xhh+XLMyMkJ+r9Rl7xesaF4RMSAdxslDJQdKcP2/7sd1aer0eJswQ/+1w8w866ZV+8/svMIPvnLJ6g+U42Olg78bP3PkDO5f5v547/8EacPnEaLswURkRGYMH0Clj+1HBn5GVe/p/JkJTa+uhHVp0X7y5+Wj+VPLUfOJP23v46eDiQjecD7jHLpKyv7BNu3v4jq6sNoaanFD37wLmbOfOjq/UeObMQnn/w7qqsPo6OjGT/72VHk5Mwc8LE0TcMrr9yHkye39XucffvW4c03vzfgz7z4Yj3i4tIC/K8KPbcbiIuT9/zyewY6O2VXoKwOjwczsrPx2qpVN92naRoe+u1vcb6xEX/9+7/H0Z/9DHnJybj7179Gx5cnX+QkJaH2hRf63f75/vsRExGBJdOmAQDau7pw78svIzcpCZ+tWYM9zz2HWIcDi19+GT08Unpwg7RbTdPQ2WOMNu3p9CB7YjZW/eTm9td3f+HMQiz/0fJBHyN3ai6++/Pv4hcbfoGnX30amqbh10/+Gj6vmDnX5e7Cy0+9jKSMJKxZtwbPvfEcHFEOvPyjl+Ht1X/7M0PPgMfTgezsGVi16rVB7y8sXIjly3817GN9+OGvYbFYbvr67Nkr8MILtf1uRUWLMWnSnYYIAoD89iC/Z4AvOINaUlyMJcXFA95X3tCA/Rcu4MTPf45pWVkAgN99+9vIWL0abx88iMcXLkSY1YqM+Ph+P/fusWP41uzZiHE4AABn6urQ3NGB5x94ADlJSQCAny9bhunPP4+qpiYUphnjDy3gBunT6+rtgobBJ43pSfGCYhQvGLj9AcDcpXMBAM6awZfQ3bH8jmufZAEP/v2D+OWqX6Kptgmp2amoq6xDR0sHHnjiASRliPa37G+X4fmVz6OptglpOfpuf0MFQ9kX/0ApLl6C4uIlg94/d+5/AwA4nZVDPs7Fi8ewY8f/xj/+4yGsXp3Z7z67PRJ2e+TVz9vaGnH27E488sja0ReuGNntQX7PANfWjEr3ly9GjvDwq1+zWq2IsNmwp6JiwJ85XFWFYxcv4rEFC65+bXJGBpKjo7F27154envR6fFg7Z49mJqZifzkgbs3CWJb4gH0+njGxmC6O7ux7719SBmXgsT0RABARl4GouOjsfeve9Hb0wtPlwd7/roHmeMzkZyp//bn1QZ/s8P3Qdd4PG6sXfttrFr1GuLjM4b9/v37/wC7PQq33vrNEFQXGrLbg/yeAYaBUZmSkYHcpCT8j3ffxX/8zd8gOiIC//bBB7h05QpqB9neee3evZiamYn5EyZc/Vqsw4Fdzz6Lh373O/xyyxYAwMS0NLz/9NOwhYWF5N+iS4O0W6P0CgTSrg27sPHljeju7EZ6Xjr+4bV/gC1cXHoc0Q48+x/P4nf//XfYsla0v7ScNDz96tMIs+m//fm0wa9vvPRd86c/PYOCgvmYOfNBv75/7961KCn5dr/eAr2T3R7k9wwMsQ6XBhceFoaNf/d3KKuvR9KPf4yoH/0IH509iyXFxbAOMObW6fHgrQMH+vUK9H39sT/8AQsmTMD+NWuwd/VqFI8bh6WvvopOLvkc3CB/uUNd/M1qzpI5+On6n+LZ159Fem46Xl/zOnq6ewAAni4P/vDLP2DCjAlY859rsHrtaoybMA6vPv0qPF36b39DtQde+oTjx9/D2bM78a1v/dqv7z937lPU1p7GggWPBbewEJMdBuT3DNCo3ZaXh2P/9E9o6eyEp7cXqbGxmPOv/4rZeXk3fe+fjxyB2+PBI3Pn9vv6WwcOoLKpCZ/+5CewWkU2fOuxx5D4zDP46/HjWHn77SH5t+jOAIGLBhYZE4nImEik56aj4JYCPFP6DI5+dBQl95bgwLYDaKptwk/+81r7e+xfHsMzpc/g+MfHcftitj+jO3NmJxobz+GZZxL6ff3f//0bmDjxK3j22V39vr537xvIyZmJvLzbQlZjKMi+pMgPA1b5nRN6Fx8pusrK6+txqKoKv3zw5q62tXv34oEZM5AaG9vv626PB1aLpd8M3r7PfXzrMrhB/nKtFrbnoWiaBk3T0Nsj5lZ4ujyw3ND++j4favc+vRiqPfDSJ9x77xosXPh4v689//wt+Na3/g3Tp9/f7+tdXe04dOhP+PrX/zWUJYaE7PbAMKCw9q4uVFx3gsUFpxPHLl5EUnQ0cpOSsOHwYaTGxCA3KQlfXL6Mp//0Jzw0cyYWFRX1e5yKhgZ8Ul6O//rhD296jnuKivDcX/6CJ99+Gz8qLYVP0/A/t22DzWpF6eTJQf836tYg7dZIYaDL3YXGi9fan/OyExfPXkR0fDSSMpLQ0dKB5rpmuBpdAIC6qjoAQFxyHOJT4tF4qRGHdhxC0dwixCbG4kr9FWxbtw12h/3qKoWiuUX4y8t/wdu/ehulK0qh+TRsW7cN1jArJs/Wf/sbqj3IficYKF1d7WhsvDZp2em8gIsXjyE6OglJSbno6GhGc3M1XK4aAEBd3VkAQFxcBuLjr91ulJSUi5SU8f2+dujQ/4PP14s5c74TxH+RHLLbg/wwIPs3oLBDVVUofemlq5//eMMGAMB3583DukcfRW1LC368YQPqW1uRGR+PR+bOxT8tXXrT4/x+715kJyTcFBIAMRFx05NP4p83b8a8X/0KVosFs3JysO2pp5B5w7JEus4gYcBmlf8nFShVp6rw0t9da38b/k20v3nL5uHRXzyK458cx5v//ObV+9/4xzcAAMu+vwz3P3E/wiPCUXG0Ah++/SHcrW7EJcdh4qyJWL12NeKSxO4qGfkZePKlJ7H5/2zGr773K1isFuRMzsFTrzyF+BT9t79wa/jg9w1+l65UVR3CSy+VXv18w4YfAwDmzfsuHn10HY4ff6/fhkFvvLESALBs2c9x//2/GNFz7d27FrNmLUdUVMKY61aN7PZg0WT3xVVVAe+/L7UEohFbsQIYJCy9ceQNTiQkAEBpfikmJk8c8L6dO4FBVgGTCT30ECBzWxf5fZpRUbIrIBq5IdptVDjbNAlDtQVe+uh6stsDwwDRSIWHD9mnxzBAfRgGyF+y24P8MBAZyXkDpC/D/NUyDFAfhgHyh8Mhfy69/DBgtYrfBJFeREcPfXf40PeTOYRZwhBhG/hkS2DYZkQmokIwlB8GADV+E0T+Gqa9Rtt5lafh2wHDAPVRoS2oEQZU+E0Q+WuYMJAUmRSiQkhlw7WD2FjAZpyVqDQGSQpcMtQIA+wZID0Zpr2mRqWGqBBS2XDtwGIBUlJCVAwpLVWBSwbDANFIDdNeI8MjOW+AkBo9/BWeYYAANdqBGmFAhT4SIn/50V5TohT46yap/GkDKrwjJLkiIoC4ONlVqBIG+BdBemGzAYmJw36bP+8Kybhi7DFw2IZfJaXCO0KSS5U2oEYYiI0V8YhIdcnJfu2LwZ4Bc/P3/39CAicRmh3DwI1U+Y0QDcXPXqyMmAxDnWBIIzMudpxf32exAJmZQS6GlJaVJbsCQZ2rFYcKSA/8DK32MDsyY3iVN6u8hDz/v9f/byWDCQ9nGLgZewZID0bQTkfygkDGkRyZjBh7jN/fzzBgXtnZQFiY7CoEdcIAewZIdX5OHuyTn5AfvFpIWSMNgdHRfC9kVioFQXXCACcRkur8nDzYJ8Yew90ITSgvfuRXeJVeFCg0LBYgN1d2FdeoEwYAzqQhtY2ifY7mhYH0Kyo8alTLShkGzCc9Xa0z+tQKA/yLIJWNon0WJhUGoRBS1Wj/f6ekAPHxAS6GlDZhguwK+lMrDOTmjqgblihkIiOBtLQR/1hiZCJXFZhIUWrR6H929D9KOmOzARMnyq6iP7XCwCgvuERBN4agOi1tWoCLIRVlx2UjLmL0+8pOnswNiMxi4kTAbpddRX9qhQGAQwWkpjG0y/yEfESF8zAuoxtLrwAgXhwKOapkCtMUfH/AMEA0nLAwsSB4lKwWK6akTAlgQaSaGHtMQCaLcqjA+DIy1DybT70wkJioxhFORH3GjRtz/+3UlKncntjApqRMgSUA851SUjhSanSqBj41r07sHSCVBKA9RtujubLAoOxhdkxLDVy/74wZAXsoUkxsLFBQILuKgakZBlRbc0HmZbUC48cH5KFmZ81GmEWRvUcpYGakz0CELXAbpo0fzw1ZjWr2bHFJUZGaZaWlcX9OUkNBQcB2Bomxx4x5khmpJSo8Crek3xLwx50zJ+APSZIlJak9QVTNMACoO7BC5hLgdjgrcxbsYYqtKaJRuzXzVtisgV8PmJU1pjmrpKCSErW30VE3DBQWqrcQk8wlOVlM/Q0gh82B6enTA/qYJEdcRFxQV4mUlATtoSnEMjLUOodgIOqGAZsNmDRJdhVkZkHqnZqePp37DhhAybiSoK4QSUnh9Cmj0EOwUzcMAGruzEDmYLcHbb9Qm9WGhbkLg/LYFBq58bkoSAz+tPB589hBqndTpgS8gzEo1A4D8fFijTdRqE2cGNS9YfMT8rnUUKciwiJwR94dIXmuqChg/vyQPBUFQUwMMHeu7Cr8o3YYANg7QHKEoN0tyFmASFtk0J+HAmtezryQDvNMmqT+eDMN7I479NOzo34YyMsTuxIShUp+PpCQEPSnibBF4Ct5Xwn681Dg5MbnYlJy6Ocy6elFhYQpU/S1IkT9MGCxALffLrsKMguLJaSzfThcoB+hHB64EYcL9EVPwwN91A8DgHinlp4uuwoyg0mTQtIrcL2FuQsRHxEf0uekkbsr/y6pq0AmTeLqAj2wWoHSUv315OgjDADckouCLywMuO22kD+tPcyOxYWLuRmRwm7Puh15CfLPTLnzTm7Oqrr584HMTNlVjJx+woAedm0gfZs2TfTvSZDgSMDXxn8NFii8RZlJFSQWYFbmLNllABALXBYtAiI571RJRUX63TxXP2EAUH8/R9Ivux2YJfeCnxOfg5JxOtidxERSolJwV/5dssvoJyZGBAJVD7wxq8xMfc/r0FdzSkrioBkFx4wZQETgTp4bdRkZMzAxKTibHdHIRNoisWjCoqCcPTBW6enAV7gQRRmxscA99+g7oOmv9NtvD+pmMGRCMTHALYE/eW607si7A9lxOlqTZED2MDvuLbwXMXY5w0b+mDwZmDlTdhXkcACLFwfscFNp9BcGYmP1sdEz6ccddygVMMOsYVg0YREyY3Q4C8kAwq3hWFK4BKnRqbJLGVZJiVI51nTsduC++0Sntd7pLwwAQHGxPjZ7JvUpujOIzWrDvYX3IiOG7TyUbFYbFhcuRnqMfpYyz5un30lretYXBIyyukOfYQAA7rpLqXdzpEOK7wwSHhaO+ybeh6zYLNmlmII9zK7b3/fCheI9EoVGRASwdCmQlia7ksDRbxiIi+NwAY2NDvZ47eshyInLkV2KoTlsDiyduFTXPTHz53MOQSg4HMCyZUCq+qNII2LRNE2TXcSYvPceUFcnuwrSmylTRBjQCU3TsP/SfnzR8IXsUgwnKTIJiyYsQlxEnOxSAuLUKWDfPsDnk12J8SQmismCccZoKv3oPwy0tgJ//jPQ2yu7EtKLmBjgm99UvldgIGedZ7G7ejd8Gq/0gZCfkI/S/FKEh4XLLiWgamqADz4AurpkV2IceXnAV78KhBurqVyl/zAAACdPAnv3yq6C9MBiAZYsUXLSoL/q2+ux4/wOuHvcskvRtVkZs3D7OOMegtbWBrz/PtDcLLsS/Zs1y/jn5RkjDADArl1AWZnsKkh1JSWGGFjt8HRg+7ntaHQ3yi5Fd2xWG+7MuxMTkoy/gVlPD/DRR0BlpexK9MlmE+dBmGGvO+OEAa8X2LQJaGiQXQmpqrBQ9PMZhE/z4UjtERyrO8ZhAz9lxmTizvw7DTM/wF8nTwKffcbR1JFITRWL1hITZVcSGsYJAwDgdgPvvgt0dMiuhFSTmgo88IA4mdBgmtxN2FW5C02dTbJLUZbNakPJuBIUp5l3/V1rK/Dxx0BtrexK1NZ3eOmMGeY6CsdYYQAAGhtFDwEjMPWJigK+/nUgOlp2JUHDXoLBmbU3YDDsJRic2XoDrme8MAAAFRXAzp2yqyAVhIUB999vrN1BhuB0O/HpxU9R2863f5G2SNyWdRuKUrk9341aW4E9e4BLl2RXoobwcDFJ0Gy9AdczZhgAgAMHgGPHZFdBst11FzBpkuwqQu5iy0UcuHzAlEMH4dZwzMiYgVvSbjHcksFAu3xZXCobTToP1WoVWznfeqv+DxoaK+OGAU0T02grKmRXQrLcdpu4mVhFcwUO1RxCa3er7FKCLswShqLUIszKnAWHzeRX9hE6fx44eBBoaZFdSWhYLGI+8ezZ4uw7MnIYAMQWXB9+CFy4ILsSCrWZM7ld9Zd8mg9nnGdwouEEXF0u2eUEXLg1HBOTJ2JmxkyljxxWnc8HnD0rOlTb2mRXExwWi9g8aPZsY5w0GEjGDgOAaOHbtwPV1bIroVApLhYbtdNNatpqcKrxFCpdlbqfaJjoSMS0tGmYmDSRwwEBpGnAxYtiW+OLF8XneudwiB3Ii4rEBqR0M+OHAUDsQbBjBwOBGUybBixYILsK5bl73DjdeBpnnGfQ0aOfpbhWixX5CfmYljoNmbGZsssxvLY24PRp4MwZfW5tnJ4uLgkFBWJ+AA3OHGEAED0EH3zArbiMbPp0pY8kVlVDRwOqXFWoaqlCc6d6e9dGhEUgNz4XeQl5yInLYS+ABF6vWHlQVSVunZ2yKxpcWpoYCsjPN+cSwdEyTxgARCD46CPg3DnZlVCgmWHz8BBo625DVUsVqluq0dDRAI/XE/IaLLAgMTIR2XHZyIvPQ0ZMBixmXe+lqIaGa8FA9tkHNhswbpwIALm5YlsRGjlzhQFADIDt2yd23iD9s1iAOXNErwAFXEtXCxrdjXC6nVdvgQwIfS/8KVEpSIlKQWpUKpKjkmGz2gL2HBRcnZ1iaaLTKT42NorNYIPBahXv9lNTgZQU8TEpyZAbi4ac+cJAn9OnxUmHPPRbv+x24GtfA3JyZFdiKu4e94C3zp5OeDUvNE2DT/PBYrHAarHCarHCHmZHVHjUTbfo8GiEWXklNxq3G2hqEjvDu93XPvbdPB5x6dU0cbNYxAu91QpERorNQqOi+t/i4/nCH0zmDQMAUFcnVhrocWaM2cXHA4sXAwkJsishItI9c4cBAGhvF4d+N5lvpzbdyskRPQJ2u+xKiIgMgWEAECd2fPQRNyfSg+nTxRwBTigjIgoYhoHrHTkCHD5sjF02jMZmAxYuNOU5A0REwcYwcKOGBmDXLsDlkl0J9cnMBO68E4jjEbRERMHAMDAQrxc4dAj4/HP2Eshks4nzBYqLZVdCRGRoDANDYS+BPOwNICIKGYaB4bCXILTYG0BEFHIMA/5qaAA+/RSor5ddiXHl5QHz5rE3gIgoxHiOk7/S0oAHHwQWLeLpF4GWkSF+t4sXMwjo2Lp162CxWPrd0tLSUFpaiq1bt8oujxRz7tw5PPHEEygoKIDD4UBcXBwWLFiA3/zmN+hU+SQkg+IG4COVny/ewZaViWWI7e2yK9KvpCQxJJCbK7sSCqDnn38e48ePh6ZpqK+vx7p163Dfffdh06ZNWLZsmezySAFbtmzBww8/jIiICDzyyCMoLi6Gx+PBnj178Nxzz+HkyZN4/fXXZZdpKgwDo2GxAJMnA4WF4sCjY8e4pfFIxMYCs2eL3x83DzKcJUuWYPbs2Vc/f+yxx5Ceno63336bYYBw4cIFrFy5Enl5edi5cycyMzOv3vfkk0+ioqICW7ZskVihOTEMjEVYmNgRb8oU4MQJcfhRR4fsqtSVkCAmBk6ZIk4kIVNISEhAZGQkbDZebgh44YUX0N7ejrVr1/YLAn0KCwvx9NNPS6jM3PjXGQh2O3DrrcDMmeKA71OngMuXZVelBqtVDK0UFQFZWbKroRBoaWmB0+mEpmloaGjAK6+8gvb2dnznO9+RXRopYNOmTSgoKMD8+fNll0LXYRgIJKsVGD9e3FwuEQrKysR5nWYTHS16AKZOFeePkmncfffd/T6PiIjA73//e9xzzz2SKiJVtLa24vLly3jwwQdll0I3YBgIloQEYP58MUGuokKEgvp6Y+9VEBYm3v1PmSImWXIowJRee+01TPryDIn6+nr88Y9/xOOPP47Y2FgsX75ccnUkU2trKwAgNjZWciV0I4aBYLPZxIvjlClikmF1tRhKuHQJ6OmRXd3YORxiNUBeHpCdDYSHy66IJCspKek3gXDVqlWYNWsWfvjDH2LZsmWw8+hp04r7culwW1ub5EroRgwDoeRwiFP3Jk0SOxvW1IhgUFWlr4mHCQnixT8vD0hP54oAGpLVakVpaSl+85vfoLy8HNOmTZNdEkkSFxeHrKwsnDhxQnYpdAOGAVnCwoCcHHFbuBC4cgVobAScTvGxqQno7ZVdpZgcmZoKpKSIj6mpYmkg0Qj0ftmW27kvh+ktW7YMr7/+Oj799FPMmzdPdjn0JYYBVSQmituXY63QNDEJsS8gOJ1igyO3G/D5Av/8NpuY6Bcbe+2FPyWFOwLSmPX09GD79u2w2+2YOnWq7HJIstWrV2P9+vV4/PHHsXPnTqSnp/e7/9y5c9i8eTOXF4YYw4CqLJabA0Kfri4RCq6/dXQA3d0iRPh84qZpYhKfxSI+Wq1iqCIqStyio6/9N8dxKUC2bt2KM2fOAAAaGhrw1ltvoby8HGvWrLk6ZkzmNWHCBLz11ltYsWIFpk6d2m8Hwn379mHDhg149NFHZZdpOjyoiIgCYt26dfje977X72sOhwNTpkzBE088gSeeeAIWzi+hL5WXl+PFF1/Ejh07UFNTg4iICEyfPh0rV67E97//fURERMgu0VQYBoiIiEyOC8GJiIhMjmGAiIjI5BgGiIiITI5hgIiIyOQYBoiIiEyOYYCIiMjkGAaIiIhMjmHAoH7729/CYrFgzpw5skshIiLFcdMhg1qwYAFqampQWVmJ8vJyFBYWyi6JiIgUxZ4BA7pw4QL27duHl156CampqVi/fr3skoiISGEMAwa0fv16JCYmYunSpfjmN7/JMEBERENiGDCg9evXY/ny5bDb7Vi1ahXKy8tx8OBB2WUREZGiGAYM5vDhwzhz5gxWrlwJAFi4cCGys7PZO0BERINiGDCY9evXIz09HaWlpQAAi8WCFStW4J133oHX65VcHRERqYhhwEC8Xi/eeecdlJaW4sKFC6ioqEBFRQXmzJmD+vp6fPjhh7JLJCIiBXFpoYHs2LEDixYtGvT+Rx55BG+++WYIKyIiIj1gGDCQRx99FFu3bsVrr712030bN27E5s2bUV9fj8jISAnVERGRqhgGDKKzsxPp6el4+OGHsXbt2pvu37dvHxYsWIB33nkHK1askFAhERGpinMGDOK9995DW1sbHnjggQHvnzt3LjcgIiKiATEMGMT69evhcDhwzz33DHi/1WrF0qVLsW3bNjQ1NYW4OiIiUhmHCYiIiEyOPQNEREQmxzBARERkcgwDREREJscwQEREZHIMA0RERCbHMEBERGRyDANEREQmxzBARERkcgwDREREJscwQEREZHIMA0RERCbHMEBERGRy/x/pgroZ6uNZRwAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "venn3([\n",
    "    set(part_first['smiles'].tolist()),\n",
    "    set(part_second['smiles'].tolist()),\n",
    "    set(part_third['smiles'].tolist()),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_1 = pd.concat([part_first, part_second])\n",
    "train_1 = part_third.copy()\n",
    "\n",
    "test_2 = pd.concat([part_first, part_third])\n",
    "train_2 = part_second.copy()\n",
    "\n",
    "test_3 = pd.concat([part_second, part_third])\n",
    "train_3 = part_first.copy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_1 = train_1[:500]\n",
    "train_2 = train_2[:500]\n",
    "train_3 = train_3[:500]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [],
   "source": [
    "min_vertex_k_cut.test_split(train_1['smiles'], test_1['smiles'], threshold=0.4)\n",
    "min_vertex_k_cut.test_split(train_2['smiles'], test_2['smiles'], threshold=0.4)\n",
    "min_vertex_k_cut.test_split(train_3['smiles'], test_3['smiles'], threshold=0.4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib_venn._common.VennDiagram at 0x7fe963395e40>"
      ]
     },
     "execution_count": 27,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXsAAAGJCAYAAABrZJMZAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAABEc0lEQVR4nO3deXhc9X33/fc5Z+bMopnRvlreV7yyGcxyQ0xYAyQNTQJp9jZpytMmPEkgpXea3m3au3laruQupGlo2uaiaZyEwB0aUsoOIQFM2AIYgzHeN1mLJc1o9uWc548TC0sa25I8M78zM98Xly5sSdZ8tZyPfvM9v0WzbdtGCCFETdNVFyCEEKL8JOyFEKIOSNgLIUQdkLAXQog6IGEvhBB1QMJeCCHqgIS9EELUAQl7IYSoAxL2QghRByTshRCiDkjYCyFEHZCwF0KIOiBhL4QQdUDCXggh6oCEvRBC1AEJeyGEqAMS9kIIUQck7IUQog5I2AshRB2QsBdCiDogYS+EEHVAwr6M/umf/glN0zj33HNVlyKEq9x1111omjbhpaOjg40bN/Lggw+qLq8meVQXUMs2bdrEggULeP7559mxYwdLlixRXZIQrvK1r32NhQsXYts2/f393HXXXbznPe/h5z//Oddcc43q8mqKjOzLZPfu3Tz77LN885vfpL29nU2bNqkuSQjXueqqq/joRz/Kxz72MW6++WZ+9atf4fV6+dGPfqS6tJojYV8mmzZtorm5mauvvpoPfOADEvZCTENTUxOBQACPR5oOpSZhXyabNm3iuuuuwzRNPvzhD/P222/zwgsvqC5LCFeJRqMMDQ0xODjI1q1bufHGG4nH43z0ox9VXVrNkV+fZfDSSy+xbds2vvWtbwFw4YUX0tvby6ZNm1i/fr3i6oRwj0svvXTC330+H9/73ve47LLLFFVUuyTsy2DTpk10dnayceNGADRN4/rrr+cHP/gB3/jGNzAMQ3GFQrjDt7/9bZYtWwZAf38/P/jBD/j0pz9NOBzmuuuuU1xdbdFs27ZVF1FLCoUCc+fO5eKLL+av//qvx1//m9/8hg996EM8/PDDXH755QorFEK9u+66i0996lO88MILnH322eOvtyyLM844g8HBQfbs2YNpmgqrrC3Ssy+xJ554gr6+Pn784x+zdOnS8ZcPfehDAHKjVogT0HWdjRs30tfXx9tvv626nJoibZwS27RpEx0dHXz729+e8raf/vSn3Hfffdx5550EAgEF1Qnhfvl8HoB4PK64ktoiYV9CqVSKn/70p3zwgx/kAx/4wJS39/T08KMf/Yj777+f66+/XkGFQrhbLpfjkUcewTRNTjvtNNXl1BQJ+xK6//77GRsb473vfW/Rt2/YsGF8gZWEvRDw4IMPsm3bNgAGBgb44Q9/yNtvv82tt95KJBJRXF1tkbAvoU2bNuH3+487bUzXda6++mo2bdrEkSNHaG1trXCFFWbbkMuBroNhgKaprkgZ27bJW3kKdsH5v1UY/7NlW+iajmmYmIaJV/fiNbyqS66Iv/iLvxj/s9/vZ8WKFXznO9/hs5/9rMKqapPMxhHTl83C6ChEo5BMOn/PZiGTKf7nXG7iv9c0J/QN451fAMf+3e+HhgYIhaa+uHS6ajKXJJ6NE8/GGcuMOf/POv9P5pLjwW4zs8tMQ8NreMd/ARz9JeD3+In4IjT6G2n0NdLob8Q0ZMaKODkJezGRZUEs5gR6NOqE+9GAT6XU1eX3vxP84TC0tkJHBzQ1VeThR1IjDCYHGUgMEMvExoO9YBcq8vgn4vf4x4P/2P83B5rRNZlwJxwS9vUuFoPDh6GvD/r7nb9bluqqps/rhfb2d146OpxfCKcgmUsykBgYfxlKDpEtZEtUcOV4dA/twXa6w910hbrobOism/aQmErCvt6MjjrBfvQlkVBdUen5/U7ot7dDdzd0dTltouMYSg5xMHaQ/kQ/g4lBErka/JrgtIZag610hbroCnXRHeom4JUpwPVCwr7WxWKwb9874Z5Oq66o8rxemDMH5s2DuXPJ+U0Ojh1kX3Qf+6L7SOaSqitUJuKL0BvpZVHzIrpD3Wh1fBO91knY16J4HHbtgp07YXBQdTWuUPDqpFp8JIM2sQAMmjoH9BwjWu7k/7hOBDwBFjYvlOCvURL2tSKZfCfg+/tVV+MKBdMg2WKSDNpktHTR+TA5r5dhn5eDRp5Brfr68uUiwV97JOyrWSoFu3c7AX/4sDOvXZBuNBlrNkgZqRlNeMyYJn1+g11ampwmX8ujjgb/kpYldIW6VJcjZknCvhodOABbtzq9ePn2AWDpGokOP2MNBXKc2gjd1nWOBHzs8uSlzTNJS6CFVe2rWNq6FI8uazKriYR9tcjlYPt2J+RHR1VX4xq5oJexNi8JbxqL0k8ZTfpMDvgM9uqpMnz06mUaJstal7GqfRWN/kbV5YhpkLB3u0QCtmyBbducVakCG0i1+hmLQFqvzOyigmEwEDDZ5ckRJ1+Rx6wW8xvns65rnbR4XE7C3q2Gh+G112DHjupa5FRGtq4x1hlgLJglrzBwYwE/b/kKDCMtnmN1NHSwtnMtC5sWyg1dF5Kwd5uhIXjxRacfLwBnJJ/oCBAN55SG/GQjQT9vevOMae6pyQ1aAi2cM+cc5jXOU12KOIaEvVskEvDCC05fXoxLtfgYabZP+aZr2Wgw2BDkDU+atHT1J+gJ93DunHNpb2hXXYpAwl69XA5eecXpy+dlhHhUJmIy2qaR1jKqS5kWW9fpC/rYZsi0zckWNy9m/Zz1RHyyP71KEvaqWJZz0/Wll9TuJukyuaCX0Q6DpFGd2zoUDIMDQZO39TQFCf1xuqazsn0lZ3afid/jV11OXZKwV2HvXvj1r2UK5TEKPoNop0ncO7OFUG6V93jY2+Blhya/yI9lGibrOtexpnONzNOvMAn7ShoehmefhUOHVFfiKvHOACOhTFnmyauW9Pt4xVeQm7iThM0wFy+4mJ5wj+pS6oaEfSXYNrz6qjPLRqZRjsv7DIZ7vKQqNFdeFVvX2Bfys02XUf5kK9tXcu6cc2Wf/QqQsC+30VH4xS9gYEB1Ja4S7wgwEq7N0fzxJH0+Xg0UiLlo+qgbyCi/MiTsy2nLFmc6pcyyGVfwGRypg9H88Tij/ADb9PrdQ/94ZJRfXhL25RCLwVNPOYeFiHGJ9gDDkfoazR9PyufjVb9FVDZam0BG+eUjYV9qb7zhzLTJyUV8VME0GJ7jJVmno/njsXWN/Q1OL9+W3QUmWNm+kg29G2TGTglJ2JdKKgVPPulsPyzGJVv9DDflKFBQXYprJf0+XvDnZAXuJM3+Zq5YcoUsxioRCftSGBqChx+uzcO7T0F0TpBRv/SmpyPv8fBKg84ROS1rAtMweffCdzO3ca7qUqqehP2p2rEDfvlLuQl7DEvXGJ7nJ2HIVMOZsHWN7WE/e2Qh1gQaGuvnrOf0rtNVl1LVJOxny7admTavvKK6ElfJ+wwG5xhkZYQ6a4dDAV4zpI8/2aLmRbxrwbukjz9LEvazkc3CE0/INsSTZCImg+0F6c+XQDzg5wVflqz08SdoCbRw+eLLpY8/CxL2MxWNOv152ddmgnhHgOFwGrsmdrZxh6zXy8tBZHrmJD7Dx7sXvZveSK/qUqqKhP1M7N8Pjz8uxwMewwZG5waJmXIjthwsXeeNsMlBTaatHktDY0PvBtZ0rlFdStWQsJ+uN9+Ep592evUCAMvQGJrnq9vVsJW0NxKUVbdFnNl9Jmf3nK26jKogYT8dr7/u7FYpxlkenYF5HjJyI7Zi9keCvCGBP8XazrVs6N2gugzXk7A/mVdfdVbEinES9OocCAfZakjgT7aqfRUXzLtAdRmuJmF/Ii+/7GxLLMZJ0Kt3MBzkdQn8KZa3Luei+RehaTJntRgJ++N58UUn7MU4CXr3OBQOskUCf4rFzYvZuHAjuqarLsV1JOyLef55WSw1iQS9+/SFg7wmgT/FgqYFXLroUgn8SSTsJ9u82dmHXoyToHevw6Egr3ok8CfrjfRy+eLLZbXtMeRX37GeeUaCfhIn6L0S9C7VFU9yej6ougzXORA7wJO7n0TGsu+QsD/qlVdg61bVVbjKO0GfUV2KOIFOCfyido/uZvOBzarLcA0Je4Bdu5w+vRhnazAoQV81OuNJllkB1WW4zusDr7OlX56tg4Q99Pc7h46ICUbmBkhL0FeVhWMpemyf6jJc57kDz7F7ZLfqMpSr77CPxZxNzQqyS+OxxroCjHllT/WqY8OqsRwR5KbksWxsntzzJAOJAdWlKFW/YZ/JwEMPQVr2dTlWusnHSIMEfbXSLYuzEhpmHV/axeStPA/teIhYJqa6FGXq8yfCsuDRR2Wb4knyAQ9DrXnZpLjKmbkc56RNNPlGTpDOp3nw7QdJ5+tzgFefYf/LX8KhQ6qrcBXL0Bjo0eXgkRrRkE5zRkFm6EwWzUR5eMfDFKz6+zmvv7D/zW9g+3bVVbjOkXk+cshc+lrSLjN0iupP9PPcgedUl1Fx9RX2fX2ysVkRo3MCJGVP+pokM3SK2zq4lT2je1SXUVH1E/bZrDPFUlbUTZBoDxD1yw3ZmvXbGTohmaEzxVN7niKRTaguo2LqJ+x/+UuIx1VX4Sq5oJcjERnR1zrdsjgjbaguw3UyhQxP7H6ibrZUqI+wf+stZ5WsGGcDR7p0OSC8TgTTGVZYcsN2sr54Hy/31cdW5rUf9tGos8GZmGCsJyhbIdSZefEUjbZXdRmu83LfyxyOH1ZdRtnVdthbFjzxBOTzqitxlVzQy2hA+vT1RrNsTk9rMv9+EhubJ3Y/QSZf24Of2g77F1+EwUHVVbiKtG/qmz+TZaVMx5wino3z1N6nVJdRVrUb9ocOOYeFiwmkfSN64ylakHbOZHtG97BtaJvqMsqmNsM+n4df/EKmWU4i7RsBgA1rk1qNXvyn5vmDz9dsO6c2v98vvyzTLCdx2jeatG8EAL5sltV5aedMls6nef5gbZ5tUXthH43Ca6+prsJ1nPaNbIcg3tEdT9GBqboM19k2tI3BRO3d66u9sN+82ZmFI8ZJ+0Ycz8okMjtnEhubp/c9XXOLrWor7Pftc17EBMNdhrRvRFG+bJZltrRzJhtMDtbczdraCftCAZ59VnUVrpNq8ZPWZEsEcXxzE1k57KSI5w8+X1N739fOd/i115xjBsU4Gxhprr99u8XMGIUCq/J+1WW4TqaQqambtbUR9omEs0+9mCDeFSBHTnUZogp0JJJydm0R24a21czZtbUR9s89J1siTGIZGtEGmX0jpsmGlVlZaFXMM/tqY2+t6g/7w4dh507VVbhOrDsgRwyKGWlMpmiTqZhTDCYHa+Kgk+oPezl5aoqCV2fMVzs3lkTlLE9rqktwpZcOvaS6hFNW3WF/+LAcHF5ErMuPhaw1EDMXSmfolmMMpziSOsLukd2qyzgl1R32L9fHoQMzUTANxkxZQCVmb6k8KSzqpb7qHt1Xb9gPDMCBA6qrcJ1Yp08WUIlTEshk6LVlKuZkw6nhqh7dV2/Yy6h+ioJXl1G9KIn5GRkwFPNqf/Vum16dYT8yItsiFBFv98uoXpREKJ2RIwyLGEgMcGisOu8TVmfYy66WU9hAPCDz6kXpLC5I2BfzyuFXVJcwK9UX9skkvP226ipcJ9XiI48sLBOl05pM47VlKuZkB2IHGEoOqS5jxqov7F9/XbYwLiLeKBelKC3dslgkN2qLen3gddUlzFh1hX2hAG++qboK18kFPKR0mS8nSq8nJc8Wi9k1sotcobr2naqusN+7FzK1eT7kqYi3Sm9VlIeZy9Eji6ymyFt5do3sUl3GjFRX2G/frroC17F1jYRPbsyK8lmQlRZhMW8deUt1CTNSPXuaplLKFlF9+8knue3RRzkcjbKut5dv3XAD5yxcqKSWyRJtfgrU19z6X7+2ne/+5BG2vL2PgSNR/vmvbuSKC04ff/vgSIz/719+yq9eeoNYPMk5a5byV39yAwt7OwHYf3iI//HRrxT92N/+6h9y9cVnAfDqtj383b/9lC3b96FpGuuWL+DP/vA6Vi6eW/bP0U3CqTRh08OY5p6WzpM/eZJH/+NRokei9C7t5YZbbmDh6spek4fjh4mmozT6Gyv6uLNVPSP7HTuU3Ji9+4UX+OK99/K/rr6al7/yFdb19nLFHXcw4JKDUuKh+tvZMpnOctqiXr72uQ9PeZtt2/zhX/wT+/sG+Ze/+n944M4/Z05nKx/98j+QTDktwJ72Fp7/yd9PePnCJ66lIeDjXeesAiCRSvOJP7uDno4W/vMfb+Xef7iFUNDPx2+9g1y+/r7miwvu2Q3zhUde4N7/cy9Xf+ZqvvKDr9C7rJc7PncHseHKX5Pbj1RPt6F6wl5RC+ebjz3GZy68kE9dcAEre3q48yMfIWiafM8FRyBmwyYZrf5aOBvPWc3Nv/87XHnhGVPetvvgAL95czd/c9NHWLdiAYvndvG/b/o90tkc9z/5AgCGodPR0jjh5eGnX+Hqi8+mIeDMPtm57zCjYwm++In3snhuF8sW9HDTx65haCTGwf4jFf183aAtlXHNweSPbXqMC3/nQi547wX0LOrhI3/2EUy/ybP3V/6a3H5ke9UcTF4dYT88DEcqf4Fl83le2rePS087bfx1uq5z6YoVbN6l/uZMvNlQXYLrZLNOq8FnvnPTWtd1TK+HF17fUfTfbNm+lzd27uf6qy4Yf92iuV00Rxq4+8FnyObypDNZ7n7oaZbM66a3q7W8n4QLGYUC3ai/UZvP5dm3bR+nnTvxmlxxzgp2vVb5azKRS3AgVh17dFVH2Csa1Q/F4xQsi85weMLrOyMRDkejSmo6VspbXVO/KmHxvC7mdLTw9/96H9GxBNlcnu/8+CH6BkcYOFL8e3b3g8+wZF43Z61aPP66UNDPj7/xJf7z8V+z4uo/YeW1n+epF7Zy19c/h8eoz1+yXQX1n3d8NI5VsAi3TLwmIy0Rosf5/pZbtdyodX/Y27bTrxcTZENeWTFbhNdjcOdf/hG7Dvaz7v1f5LSrP8fmV97iXeesRtenzipJZ7L87InnJ4zqj77+y9/4PmetWsx9d9zKvf/wZZYvmMPvf+UfSWfqr3UG0Jyuz8/7ZPaO7iWTd/+UcPfPxtm/39kiQYG2UAhD1+kfG5vw+v5YjK5GtXfgk40ekMPEi1qzbD4P/vNXicVT5PJ5WpvCvO9Pvs7aZfOnvO9///Jl0pks1122YcLrf/bE8xw8fIT77vhTdN0ZE93+P/+Ade//Ao88+yrv3bi+Ip+Lm3jyedowGUJd6IeaQuiGztjwxGsyNhyjsVXNNVmwC+wZ3cPytuVKHn+63D+yV9gbNz0ezpo3j8ePWbVrWRaPb9vGeYsWKasLIOWvvxkhMxUJBWhtCrP7QD9btu/lsvNPn/I+dz/4DJeet47WpoltgVQ6i6ZraNo7zwZ0XUNDw7aq44ZcOfQU1I4PPV4P81bM483nJ16T217YxqK16q7J/bH9yh57utwf9ooPKPnipZfyL08/zb9v3sybfX3c+MMfkshm+dT55yurKe8zyCocXamWSKXZumM/W3c4F9j+viG27tjPwf5hAB546iU2v/IW+w4N8sgzr/DRP72dy88/nYvOXjnh4+w5OMDzW96e0sIBuPCslUTHknz1jh+xY28f2/cc4pbb/h3D0DnvdHeP4MqpJaO+dXjpRy7l6f98ms3/tZm+3X388Os/JJvKcv616q7Jg7GDrp+V4+42zvCwshbOUdevX89gPM5f3H8/h2MxTu/t5aHPf57OSERZTakmE+psIdWxXntrLx+++Zvjf/+bO+8B4HcvP49vfPmTDAxH+Zs772FoJEZHSyPXXbaBz3306ikf5ycPPUN3W9OUXwIAS+Z18W9/88fc/v3/4v2f/zt0XWPVkrn8+9c/T4eidoEb+LJZIkEPMYX3i9Zfvp74SJz777yf2JEYvct6+fy3Pk+kVd01mSlkGEgM0BnqVFbDyWi2m38dbdkCmzerrsJ1Bhb6SOnuvyEkatP+SJA3dLWDMDc6s/tMzu45W3UZx+XuNo6cMTuFpWuk9fpt4Qj12jJyv6iY/VF39+3dG/aWBX19qqtwnXSzHCgu1ApkMgRs9XPu3WYoOUQ6796txt0b9ocPQ179zSC3SYZUVyAEzME9e+W4hY3t6tW07g17aeEUlfbI3HqhXpOMw4pycytHwr6K5P0eCki/VKjXkJO0L0ZG9jOVTivZ+Mztsg3unikr6oc/l8OQw8inSOVTDKeGVZdRlDvDvq/P2RNHTJANuPPbJeqQDa2aHIdZzJGkOweq7kwPGdUXlfVW/vAWIY6nxZJnmsUcSbkzvyTsq0hWl5uzwj0a8/Lsu5ih5JDqEopyZ9gPu7PnpZLcnBVuE8zJ4KMY6dlPVy4Hk7YUFnJzVriPmctjujBCVEvn08SzcdVlTOG+75SM6ouSm7PCjdosuUlbjBtv0rovQSTsi5Kbs8KNWmTbhKLceJPWfWEvN2eLkpuzwo3CeRmEFOPGm7TuC3sZ2U8hN2eFW/kKEvbFSBtnOiTsp8j75amycCevbFZY1Fh2jGzBXVuRuyvs43HIuusL5AYFr7u+TUIcpVsWHmTbhGIS2YTqEiZwV4rE3TddyQ0KXrmYhHs1yE3aopI5d53m5a6wT9XvuaonUjBkpaJwrwYk7IuRsD8RCfuiCnItCRcLuixG3CKRkzbO8UnYF1XQZcaDcK+AJW3GYmRkfyIS9kXlZdqlcDGfJW3GYiTsT0TCvqiCJmEv3EvCvjgJ+xORsJ/C8ujYyMUk3MsrC6uKkrA/EQn7KQqm3J0V7iYLq4qTsD8RCfsp8qa7vkVCTKZbFpo8+Zwib+XJFdyzp5V7kqRQkNWzRViyelZUAU0m5BSVKWRUlzDOPSdiZNzzRRG1wdK82LYB6Niajo0Otoatac4Cf9vmt39Aw0az8+hk0JAe9EzpaFhyb2kKy3bPz5J7wt6WH5RibBkxFWUDFn4Kmh8LH3nLJG95yRcM8nmdXF5jtpNEDAM8ho3HY+HRChhGAV3L4iGPrmUwyKDZGdkR5hiaDfIFmcp2Ua65J+yFOA4bk6zWSLrQQDZvksvr5HOUbRxZKEChoJHJGjC+FUBgwvvoGvh8Fn5vBtNIYRJFt+v32ankfHFumkknYe92LhoZVEqBAFkayRSCpDNeMjn3RYllQyqtk0oHcH4RtODx2ATMAj5PGq8ex2vF0DT3PI0vJ13TKN+v3+olI3sxfXVw5ytHiByNpPMBUhkP1TqTL5/XGMt7GCMEhNDowmda+H05AkYUrz1csyNgvWY/s1MjI3tR9/JamGS+hXg6QK5Kw/1kbCCd1UlnfYzSgcfTQSiQIWCMYNqjqssrKenZFycje1GXCvhJ2W3E00Ey2fqbUprPw+iYj1G68Hi6CAXSBPURvERVl3bKJOeLk5G9mL4qv4psPKRoI5EJk0zLauCjnOD3M0o3prebkD+N3xjGa8dUlzYreh20G2dDRvaiptlAVmsjkW0kkfLOegpkvcjmYDjnB3rwebuJBMcI0I9WRbudShunOBnZi5pko5Oii9FkhJx7VolXlUxOYzAawTAiNDakaND60HH/ynK5Qet+EvbilNl4SNjdRJMNVTuTxm0KBRiOBRjVFhFuyBL29GPY7jr56FhZWXVclFf3qi5hnHvC3uueL4qbuHmato2HuD2HaDyA7HJbHpYN0bhJlLlEGnJEvIddGfopOXOhKL/Hr7qEce4Je9N01qkX5IfmWEbOfSlqY5CwehhNNEjIV1As4SXGXMLBHBFzAI89prokACxdx5KRfVE+j091CePcE/YAgQDE46qrcBU9655ffjY6SbuHkURIficrNJb0MpacQ2MoS8SzH91We4OkYOggYT+Fz/Cha+6ZYixh73JuGdlntRaGEh1y49VFonGTuLGY1tAoAQ4rqyPvokBzEze1cMCNYS8mMHIWKncdsTQv0dxcYglTUQXiRAoFGIg2EfRHaPEfVNLPzxsS9sVI2J+IhH1RBh7yVH6aS1rr5MhYM3lp2bheMq2TSs+lKZwirB+o6Bz9nC7TLouRsD8RCfuidFuv6IIVSwswku0lnpQVr9XEBkbGAiS8S2lpGMJnD1XkcXOyerYoCfsTCQZVV+BKRoXC3gZSzOFILIzljlsFYhayOTg82kYo2ESzeRDdLu/ZznW4zdG0SNifiIzsizIKWtlPC85rIYbTPaTScuXWinjSQyo9n/bIEXz2YNkeJ+OiLQHcxG1h764rW8K+KMMq77A+STeHRnsl6GtQwYLDo63ErPlli+S0m1f+KRT0uqtT4a6rW9o4RRn5cl2mGtHCQgajjTI2q3EjYwGGskuxKf2sqpSEfVHNgWbVJUzgrrCPREB3V0luYORKH8U2JoOZpYzG3bPCT5RXMmXQl1hEjsbSfVANRpHFF5NpaDT5m1SXMYG7klXXoalJdRWu402WdtplXgvTl1hEUto2dSeXh75oNwm6S/LxMl5T1s4WEfaF8ejuuiXqvqu9tVV1Ba7jTeXRS/StSmud9EXn1OxRgOLkbGAo2shIYTH2Kf5cpTwyPbeYZr+7WjjgxrBvaVFdgSuZ9qntCmoDMWs+/aPNcpiIACAW9zKQWkpBm/3EiDGPzLEvxm39enBj2MvIvihvbvbfKhsPw7mljIzJbCcxUTqr0Tc2n7wWntW/j8rN2aJaAu4btLov7GVkX5SZnt1w3NJ89CcXy2pYcVyFAhyOzSGnRWb8b4fl5mxR0saZjmBQ5tsXYSZnvteJpfkYSCwgk5On2uLEChb0x3pmNFMnb+hyaEkRbpyJA24Me5DRfRHeRA5tBnsmWJgS9GJGChb0j3WT05qm9f4Zr+yEWkzEF8HQ3fdMWsK+SmhM/yatjclAaqEEvZixggWHY13ktJO3IeIed8aHam7s14Nbw15u0hZl5k8+WrAx6U8tJJOVoBezY1lwONpJVjtxaMV0uTlbTEdDh+oSinJn2He484ulmpk58dstzeuM6CXoxSmybOiPdpDh+AOvUV369cV0h0uzYK3U3Bn2TU2yT04RJ7pJa+NhMLmItAS9KBHLhoFYOxmtberbdJ0RxWffupFX99IWnPr1cgN3hj1AT4/qClzHG88WvUlr42EgvViCXpScZUP/aBvZSTdtx/w+bPlxm6Iz1OmqQ8aP5c6qQMK+CM0GvzVx4zIbg8H0ItIZufJEedjAwFgXBd55tj3srm1fXKMn7N7ckrCvMoHUxFAfzS8glXHvt1HUhkIBBpNzsX973tFhXVo4xUjYz0Yk4ryICfzRdy6yuD2XWOLU9swRYroyOY2h7EKyhocYspPeZH6Pn/Zgu+oyjsu9YQ8wd67qClzHm8rjwUNGa+NIrEF1OaLOJFMGB7XFqstwpTnhOWguPnzd3WE/b57qClzJk40wGHPnHX9R+0by3QSsparLcJ25je4enLo77Ht6wCN3go5laR6S8RUUZD2LUEHTGcYkPbYQ03Zvy0KF3kiv6hJOyN1hbxhyo3aSYf9Z6KNh107vErWtEAhSQMO2NazEWnT8qktyhfZgu+sOGJ/M/Ykxf77qClxjLLCcRKoJbGjQpF8/G/c9eB/X/9H1XHbDZfzRrX/Em2+/qbqkqhL3vrMjbT7vwcycpbAa91jSskR1CSfl/rBftMgZ4de5rNnKSPqdX3zBrLtHEW70xDNP8O27vs0nPvQJ/uW2f2Hx/MXc/Nc3MxIdUV1addB0Bpm4/Xg6FcJfcH/QlZOGJmFfEj5f3Y/ubXSOsAb7mCWLvphPWjkz9JOf/4RrLr2G91zyHhbMXcCXPvsl/D4///34f6surSrkA0HyRVZwZxOL8BBSUJE7zInMIeB1/xkc1ZEWy5aprkCpWOA0stmJK2c1SyNUxxfYTOVyObbv3M5Za99pO+i6zllrz2Lr9q0KK6seMbN469CyNIz0GRWuxj2WtVZHPlVH2M+dW7cbo+W8TUTTc4q+rSElffvpio5FKVgFmpsm7tPe3NjM8OiwoqqqiG4wZPuO++ZMOkigsKKCBbmDV/eyoGmB6jKmpTrCXtNgift7YqVmo3FEWzehfXMsM27i1WUFrSi/bDCEdZKT0tKJeXjt6R9rWAsWNC3Ao1fH9PDqCHuoy1bOWHAFmeyJp7aFrXCFqqlujeFGDN1gZHTizdiR6AgtTe48WchNRoyTP7O2LQ09vY562g5zaWv1LC6rnrBvaYG2+lk1mvNEGE2dfEVeMF6f7a2Z8nq9LFu8jJe2vDT+OsuyePm1l1m1bJXCyqqA12SE6T2DzGQCBK36aOcEvUHmhIu3WN2oesIe6mp0P2wcv31zLCNtENDdPxPADT507Yd44LEHeOjJh9hzYA/f/O43SWVSXHXJVapLc7V4IAIzOOw+nehFP0F/v1Ysbl7s6r1wJquOZtNRS5bAc885h2TWsKR/Pun09Efs4UyYlDdVxopqwyUXXMJodJTv/fh7DI8Os2ThEm7789ukjXMimk6/HnA2tZ8my9IJFlaR9LxcvrpcYEVbdT2D0WzbnsG30QUeewx27VJdRdnY6PR5LyaXM6f/jzQ41H6InCV7jIvSyoYa2WU0zfwfauCNPEdOi5a8JjeY1ziPK5dcqbqMGamuNg7A6aerrqCs4oElMwt6ABsiBdn7X5TeoGeWazlsMLIrS1uMi6zrXKe6hBmrvrBva6vZfe4tzUM0O7ttnYPRoKyoFSVlBYKM2bPv9KZTEXx2dwkrcoeOhg66w9X3eVVnOpxRm6v1xgIrKBRmtw+QnteJIKN7UTqjvlOf1munlpegEnc5vet01SXMSnWGfVeX81JDCrqfWPrURguhMdk+QZSG7TUZKMGMmmzWh9+qnZOtmvxNVbNidrLqDHuoudF91L8Syzq1b4eRNgjrsshKnLrRhmZmMt3yRPLJBTWz0Gpt51rVJcxa9Yb93Lk1s8gqbzQQT5bm1J/ImLRyxKmxvT76SzhPPp/3EKD6d64NeoNVs+lZMdUb9lAzM3PGfEtnMo35hDwpD2FNRvdi9kYbmijVqP6oQrr6w35Nx5qqngRRvZUDLFwITU2qqzglluYhni7tWZ6NY/W1GZUonVKP6o/KZvz4qN77bKZhclr7aarLOCXVHfaaVvWj+4R/0Sn36icz0gYRXdo5YubKMao/SsssLMvHrYQzus7ANGa4/sVlqjvsAZYudTZJq1Jj+fJspBSJRtDKdNGK2mSb5RnVH5VORapyC+SIL8KazjWqyzhl1R/2mgYXXKC6illJ+Xpmvlp2moyMQaNWfReWUGcoULoZOMfjyVfPlsBHndd7XlX36o+q/s8AoLsbFlffXN4xrbxPayMjEQxNDmsXJ5cPhjhC+XeqTKda0DnxGQ1u0hvpZX5T9d9chloJe4ANG8BTPZt45jwRUunyLoLS8hotheptcYkK0XQOeZsq8lC2peEvVMfATNd0zus9T3UZJVM7Yd/QAGeeqbqKaYublTlmMTAcwKfX/t7iYvZSoUaSVO4ZYC7dUbHHOhWntZ1Gc6D55O9YJWon7AHWroVG9/epbTQSmcqMuDU0WpIyuhfH4fFwoMKrrnM5ExN3L4j0GT7O7jlbdRklVVthr+tw/vmqqziptK971huezYYZN2UqpihqtKGFgoJZW0bO3TvXnt1zNj5PbT0jrq2wB2cbhfnuvqGS0Cp/bmXjSGNNzCgQpWMFghxGzZGW2XSra/fLafY3s7K99vbir82r/7zzwHDnLBRbM0hlmyr+uHpOp7XQWvHHFS6l6+z3qWvvFQoGPty3J7yGxkXzL6qqs2WnqzbDPhKBs93Zb0v7ekq+Yna6gsNBGvQGJY8t3CUabiFlqx0Q6fkepY9fzBndZ9AZ6lRdRlnUZtgDrFsHcyrfLjmZpKZ2f5Dm0WaZe1/nCoEgfaj/pZ9NN7mqldMebOfM7uqZ0TdTtRv2ABs3gt89CzhsdFJZtbOFjKxBa17aOXVL1zngc8f3302tHI/u4ZKFl9T0fa3a/cwAgkG46CLVVYzL+LoqOgvneAIjAUK6nGpVj6LhVlK2ey57o1DaHV9na0PvBhr97p+2fSrc810vlwULYKU77qyndHf8YAM0j0g7p94UgiH6CKouY4JCTn3AzmucV5Ozbyar/bAHZyuFZvUr4TKW+h/so/ScTnvGPb98RJl5vOwx1V8Dk2WyATTbq+zx/R4/F8+/WNnjV1J9hL3HA+9+t9LpmJbmIZtRM6f5eHwxHy3I6trap9EXaifnovbNOBtMW93sl4vmX0TA667rslxc+N0vk5YWOPdcZQ+fNTtKdvRgKYWGQgQNdz21F6U11thGVOHo+WQMS80zzBVtK1jQtEDJY6tQP2EPsHo1zJun5KHThjv3AtHQaDvShld3bxiI2cs3hDnosj79ZHkFM9S6Ql1cOO/Cij+uSvUV9gCXXKKkf58puKdfP5mW12hPtMvJVjXG9vrY7XFfn36ybNaHXsYTsiYLm2EuX3x5TU+zLKa+PlsA04SrrnKmZVaIjU4m6+6+oDfhpc1y57MPMQu6wYGGdiWbnM2GWaHDyE3D5MolV+L3uGf9TaXUX9gDhEJwxRUVO+wkY7Zju2il4PEEh4M0aU2qyxCnTGMg0kFC8XYIM6EXyv8MREPj3QvfXVN71M9EfYY9QHu709KpwIZHWY87VixOR2QwIguuqtxoYzvDdnnONi4Xq1D+7RvOm3secxvdvbVyOdVv2IOz4GrDhrI/TM5Wvw/JdGlotAy1ENDd3XYSxSUjLcq2LT4V+Vx52yor21eyumN1WR/D7eo77AHWrIFVq8r6EDmrui4+zdJoG5EZOtUmF4qwT6vsqVOlks970ChPW3VOeA7nz3X/oUblJmEPzulWZZySmc9V11NqcFbYdsY6ZUuFKmEFguwyqrsX7aWp5B+zyd/EZYsvq7uZN8XIVwCcvv2ll0Jb6WejFHQfBas6A9NIG3QmO+VCcTnLF2Cn2ebKRXszoZd4O5FGXyPXLLsG06i+wVY5yFV8lMcDV1/t3Lgtoby3qaQfr9K8CS+dKQl8t7JNP7sDbVUzxfJEdKt0LagmfxPXLr+WoNfdC8oqSa7gY/l8TuB3lm6vjlwNHPRtxk060h0S+C5jmz52BzrcuefNLFiF0gRzk7+Ja5ZdI0E/iWbbdrU/+yu9XA4eegj6+k75Q40E1hFLqT2dqlSykSz9vn4s21JdSl17deur/Ojnd/PmrrcZPTLAjX/1z5x+wRXjb3/5Vw/xy//axL7tW0iMjfLndz7A3CXFJyHYts23/ucn2frCUxM+zrMP38O/33ZL0X9z2z0vEmkufcvT482Rb3jilD6GBP3xVWZVUbXxep1Vtg8/DAcPntKHytvl+aH79fZf891HvsuWfVsYiA7wzzf+M1ec/s4F/9DLD7Hpl5vYsm8Lo4lRHvjzB1g1d+IF/2c/+DOeefMZ+qP9NPgaOHPxmdx63a0s6Voy/j6v7nmVv/vp37Fl3xY0TWPt4rX8wSf/gEULFpXl8xInlyrkaV16Ojdc/THu/Ms/mvL2bDrJktVnc/bFV/Mf37z1hB/r8f/7b0UP1z77Xdeyav3ErX/v+vubyWczZQl6gHz+1GZ/SdCfWG08/ysHjweuvBLmntoijLxVnumLyWyS03pP42sf/tpx3372krO59brjX+xr5q3htk/cxmN/+Rjfv+n7YMPH/+HjFKwCAIl0gk/c8Ql6Wnr4z1v/k3tvuZewN8wtX7sFqyCjexUsX4CO//F+rv39WzjjwiuLvs+Gy67jmo/dxIozLzjhx9q/YyuP3vuvfPzmv5/yNtPnp7GlY/xF1w3eemUzF1x1fUk+j6JsZr23vQT9ycnI/kQMw9lW4dFHYe/eWX0IyyrPl3jj6o1sXL3xuG+/bsN1AOwf2n/c9/m9i35v/M9zmcuX3vclrvrrqzhw5ADz2+ez8/BORhOjfPG9X6SnpQeAm665iSu/diWFfQW8i7wU7EKJPiNxMoVgiF3elpLcjM2mU/zb397Ehz/3NRpbOk76/s89+lNMn58zL3rPKT/2iRj4yZOb0b9p8jdx7bJr62Zf+tmSkf3J6Dpcdhksml3bwqqSaZfJTJJ7nr2HuW1z6W52DoFe1LWI5oZm7n7mbrL5LOlsmrufvpsl3UtYEFxAd6xbFl5VSDbUyA5va8lm3fzkO19j0aqzOP2Cy6f1/s88eDfnXPI+TF95V7rqzOzjdzR0SNBPk4zsp0PXnZOugkF4/fUZ/VPLcvfv0//4xX/w9Z9+nWQmyaLORfzg//0BpseZlxzyh/jxl37MH37nD/nWA98CYEHHAr5/0/fxGB7IQNdIF4PNg6SttMpPo6Ylwy3s00s3LfHVZx/lrVc285U7H5jW++984yX69u3gU7f+n5LVcDw609/qeEnLEi6efzGGXh0DKtXcnURuomnOStuLL3bCfxoKmvsXc7zv3PfxwFce4O4v3c2izkX88Xf/mHTOCe50Ns2Xv/9lzlp8Fvfdeh/3fvlels9Zzu//4++Tzjrvo+d0OoY6aNCrZ/+fahJrbC9p0ANse+VZBg/t5QvvW8uNly/mxssXA3DnX93IN744tSf/zH/fzdzFK5m/bE1J6yhGm+a+9ut71nPJwksk6GdARvYztXw5NDU5ffxk8oTvahl+yFemrNmKBCJEAhEWdi7kjEVnsO4L63j4Nw/zvnPex8+e/xkHjxzkvj+9D/23v+Bu/4PbWfeFdTzy6iO8d/17gd/upTPYhqfdQ9SKqvx0aoducCTczuAMRrrTdeUNN3LhVTdMeN3XPnMFH7rxq6zdcOmE16dTCV586gHe/wdfLnkdxWgn2a3To3vYuGAjC5sXVqSeWiJhPxudnfD+9zuBPzBw3HezqmBkfyzbtrFtm2w+C0Aqm0LTtAlT83RNR9M0pizPsKFpoAmz2WTIGMKu+sX76timjwPB9uPuR59OJRg8uGf870N9+9m/YysN4SZaOueQiI0yPHCQ0SPOz+bh/bsAiLS0T5hhM1lLRw9t3RNnn734i//CKuQ599LfKc0ndzInCPuQGeKKxVfQGqyeLcPdRMJ+thoa4Npr4Ve/gu3bi76LZfiY4cSCaUukE+wZ3DP+9/1D+9m6fytNDU3MaZnDaGKUg8MHGRh1Lvhdh50Lvj3STkdjB/sG9/HzF3/ORSsvoiXcwuGRw3znoe/gN/3js3wuXHkhf/t//5av/uirfHLjJ7Fsi+889B0M3eC85ecVrSs4EqS7oZuBhgHylsuf1rhQPhhmt7eZwgkOu9n71mt88+YPj//9njv/BoDzLv9dPvnlb/Dq5kcnLIj61//9OQCu+dhNXPuJL8yonmcevJszLrySYKgyx2rax5l62dHQweWLL5epladAVtCWwpYt8NxzMOlLmQgsYCi1vCwPufmtzXz4mx+e8vrfPe93+cYnv8E9z97DLf8+dQXkTdfcxBeu/QL9o/386X/8Ka/vfZ1oMkpbpI1zlp7D56/+PIu7Fo+//6/e+BW3/9ftvHXoLXRNZ9XcVdz8Ozdz5qIzT1if7bEZah0iWThxq0u8I97YygHq++CYQHCYlPnChNfJjdjSkLAvlYMH4bHHIJMZf1UisJCh1DKFRallYzPWPsaIPaK6FHczDAbCHVV3ulQ5BBpGSHmfB8DQDDb0bmBVR3nPm6gXEvallEjAL34xvsVCvYf9UZlIhiHfEHlb2jqTFYIN7DNbyNTIZman6mjYtwRa6vq82HKQsC+H11+H558n4ellKF2eNk61sT02wy3DxK246lLcQdOJRlroQ6asHisQHGVxb4Jz55wrbZsSk7Avl9FREs/sZOhgeTaNqlbJpiRHvEfqeudMyxfggL+VJBJmx/JgsKSxhYvOlpuw5SDPHculqYnBlWdyINiEXWRXwXoVHA3SE+shaNTjBa2RiLSy3d8uQT9JoNCAtbcHkvX4c1EZMvWyjAyPxtZkIwe8QdbpRwgcc/O2nhkZg7b+NpItSUaMkbrYTM3yB+jztzBmyyV3LA8ePCMtpIadvW0M+R1YNvKTV0ZHf3CjOS+/pIvlgTHmZ0bRrPptYRylodEw3EDAGyDaHCVmxVSXVB6GwWiolcMEkHVmx9IIZiKkDkXIH7N/1DR3IhGzIGFfRp5JX923UmEOGAHWBEZoTMn8c3D21mkeaCYUCnEkeISMVTvPfjKhJg54wjVzbGCp+G0/hcMtJJNTF1DJyL58JOzLqNgPbqLg4blUO21mluXaCKGM7BYJ4I176Up0kWhJMKwPV/UNXMsX4HCgmZjtldH8MTwYeGPNpAaPPwPJKztml42EfRn5T7A191DWZIhOun1pljIq/XwAGxqOOK2dsaYxona0qvbYsb0mI8EmBqRlM4GOji/ZSLo/TN468WSFBpmJWjYS9mUUDDo9yBO16PsyfvrootefYok1ii+brVyBLqXndBoHGwn5QsQiMWK2y/v5Hi/RUDN9th9KdLhILdDQCGTDpPsaSeWn18qSsC8fCfsy0jQn8OPTWEd0IB3gAAEWBBIszEcxc2XaQa2KGBmD5sFmwoEw0XDUfQuyDA9joSYO0TB5W6Q6pxHIN5A93EgyM7OIkbAvHwn7MguFphf2R+1JNbCXIIv9Cebno3jyssWAJ+WhNdVKJBghFoqpD32Ph3hDI300lOyYwFqgoRHIhcgOREilZxctEvblI2FfZqFZbGJoo7EjHWIXDSwLxJmTi0noA96kl9ZkK03+JuLhODFiFb2Ra5t+RgMRBghIS/4YBga+TIh0f5hkbvbTaUxTbtCWk4R9mZ3KSMVCY1sqzDbC9PhSzNMTRNJJtDrvGRhpg8Z0IxFPhERTgqgWLesma4VgiCFvmBFkV8pjefBgJsOk+kMkS3DWsozqy0vCvsxmM7Iv5lAmwCEC+PQCCwMJuvJxfNn67utreY3QUIgGrYF0U5ox7xgpK1WaD24YZIJhBozQcU+Mqk8agUIAKxoiMxIo6ambEvblJWFfZqUK+6MylsG2ZIRtROgwM8wz4rRkknW9KlezNQIjAQIEKPgLJEIJxvSxWZyUpZEPNhA1QwzZPqdVU99PosZ58GCmwmSGGkhly/PLT8K+vCTsy6zUYX+sgayPAXx4tGYW+JN0W3GC2fqer2+kDSLpCGHC5CI54r44CRIn7O3bpp94IMQgQbJoEvC/ZWBg5oJYsSCZUX9JR/HFSNiXl4R9mZUz7I/K2zo70iF2EKLJm2O+N0FTPoW/jufsa2iYMZMWWmg2mkmH0yTNJEk7iWVbWL4AKV+QYT0gbZpjTAx4H6kKzjaKRCr2UHVJwr7MfD5nrn2yQlvhjOa8jOaagCZ8eoFuM0ObliacS2HW6YweraDhizWQM1vJ6j76/Rp5T5aslqqLHTdPxsSLJxugMBaoeMAfq6NDycPWDQn7CujogD17Kv+4GctgTzrIHpw9wkOePN3eNK2kCWXTGIXaDrqMaTJi+Om3AgxkfFjp34ZYEhh2/miGs3jCaSxfmqyewaL2730YGHjzfkj6ycUCZDMGqp8Der3Q2Ki4iBonYV8BqsJ+snjew9v5EG/j9JZazSydnjTNhRQNuWzV3uS1NY2s10vCMBnTvEQLJsM5L5lp3EjMjplkx0wgAtiYodxvwz9DzshQoPp/IZqYGDkTMj7yCZNc3HTdZ9Xe7qw4F+UjYV8Bbn16eiRrciR7NOickX+zJ0dEz9FgZwkWcpi5nKvm9RcMg7TXS1w3idkmI3kv0ZwXK1uKpNDIxk2y8Xfm0xtmAW9DFj2Qwzaz5I0sOdw55VVDw4sXo+BFy5oUEs4vsmwJ5sCXW3u76gpqn4R9BRwdtbgoM4uK5z3E8x4gMOH1DUaesCdPSM8TIE+QPD4rj7dQQLNtNMtCP8VPztJ0LEOnoOvkdZ28ZpBHJ6vpZNEZs7yM5EySBYNKDksLWYNCNgAj73xNNN3G489j+PNoZh7Nm8fy5LH0PIXf/lcOGhoGBoZtoFsGmmVgZ73YGQ/5tJd8ynBmE1UhCfvyk7CvAK8XmptheFh1JbOTKHhIFE7+o2JoNh7NwqPZv/3z0RcLAxtDtzGwydk6WVsnbRlkLJ1MQceyNco+t69EbEsjl/SSK3L4xm/fA91roXssdK+F5rHQPQXQbcB22hUa2ON/tsHWwNawCxq2pYGtg6VhFTTsnEEha2DldfJUzZdpRiTsy0/CvkI6Oqo37KerYGsUbIP6nukPoGHlDKycASVa0FvL/H4Ih1VXUfvc38yrEW7t2wuhmlwblSFhXyHyAy1EcdLCqQwJ+wppbpbtW4UoZs4c1RXUBwn7CtE0mDtXdRVCuIvfD52dqquoDxL2FbRwoeoKhHCX+fNlMVWlSNhX0Lx5YMieW0KMW7BAdQX1Q8K+grxe6U8KcZTHA729qquoHxL2FSatHCEcvb3yTLeSJOwrTHqUQjikhVNZEvYV5vdDd7fqKoRQS9edgY+oHAl7BWREI+pdV5dzsI+oHAl7BaRvL+rdokWqK6g/EvYKNDRAT4/qKoRQw+uFJUtUV1F/JOwVWb1adQVCqLF0KZjmyd9PlJaEvSLz58u2rqI+rVqluoL6JGGviKbBypWqqxCisnp6nE0BReVJ2Cu0YoWzilCIeiGjenUk7BXy+Zz+pRD1IBSSaccqSdgrJjdqRb047TRZPa6ShL1izc0yDVPUPsNwwl6oI2HvAjK6F7Vu8WJnqxChjoS9C8yfLzMURO3SdTjrLNVVCAl7F9A0OPdc1VUIUR4rV8qaEjeQsHeJefOkdy9qj2nCmWeqrkKAhL2ryOhe1Jq1a6VX7xYS9i7S3i4bRInaEQw6YS/cQcLeZdavd25oCVHtzjpLVoi7icSKy4TDMhVTVL+mJli+XHUV4lgS9i50xhlyio+obvIM1X3k2+FCPp8T+EJUo+5uOY3NjSTsXWr1amhrU12FEDPj8cC73qW6ClGMhL1L6bpz0RiG6kqEmL4NG2QBlVtJ2LtYSwucfbbqKoSYnjlz5EAeN5Owd7m1a6GrS3UVQpyY1wsXX6y6CnEiEvYup2lOO0fmKws3O+8853AS4V4S9lUgEnF6oUK4UW+vc8SmcDcJ+yqxcqVzUQnhJqYp7ZtqIWFfRS6+2Lm4hHCLCy6AhgbVVYjpkLCvIg0NModZuMfq1bB0qeoqxHRJ2FeZBQvgnHNUVyHqXW+vc1NWVA8J+yp0+ukyohLqNDbCpZc6M8VE9ZCwr1IXXQSdnaqrEPXGNOHKK+XeUTWSsK9ShgGXXy5zm0XlaJozom9sVF2JmA3Ntm1bdRFi9oaH4Wc/g1xOdSXV48knv82jj95GNHqY3t513HDDt1i4UG6EnMz558tZC9VMRvZVrqUF3v1u6Z9O1wsv3M29936Rq6/+X3zlKy/T27uOO+64glhsQHVprrZihQR9tZOwrwHz5slh5dP12GPf5MILP8MFF3yKnp6VfOQjd2KaQZ599nuqS3Ot3l648ELVVYhTJWFfI9aulQNPTiafz7Jv30ucdtql46/TdZ0VKy5l167NCitzr54e596QnDpV/eRbWEPWr3emZYri4vEhLKtAODxxGlMk0kk0elhRVe7V1eXMvJFN+GqDhH2NOeccWLdOdRWi2nV0wFVXSdDXEvlW1qCj/ftXX1Vbh9uEQm3ousHYWP+E18di/TQ2yqEBRx0d0Xu9qisRpSQj+xp17rlyytVkHo/JvHln8eabj4+/zrIstm17nEWLZO0/OD3697xHFk3VIhnZ17Azz3RGZ5vl3uO4Sy/9Infd9QkWLDibBQvO4fHH/4FsNsH5539KdWnKzZ3r3IyVc49rk4R9jVuzxgn8X/0KZPkcrF9/PfH4IPff/xfEYofp7T2dz3/+ISKR+t57YvFi2LhRZt3UMllBWyf274fHH4dsVnUlwm3Wr5dpu/VAwr6OxGLw8MMwMqK6EuEGXi9ccgnMn6+6ElEJEvZ1JpeDJ5+EPXtUVyJUikTgiiuguVl1JaJSJOzr1Msvw4svqq5CqNDb6+yn5POprkRUkoR9Hdu71xnlSx+/fqxZAxs2yMZ59UjCvs6NjsIjjzj/F7XL43E2M1u2THUlQhUJe0E268zFf+st1ZWIcujqgosvlkNH6p2EvRh34IAzH39sTHUlohQ8Hmda5erV0rYREvZiklwOnn8etm5VXYk4FV1d8K53ObNuhAAJe3Echw/DU09BNKq6EjETHo+z8+mqVTKaFxNJ2IvjKhSc6ZmvvSZbLVQDGc2LE5GwFyc1OOj08oeGVFciigkGnR1OV6xQXYlwMwl7MW27djkjfZmm6Q6m6ZxMtnq1HDIiTk7CXsyIbcP27fDSSxCPq66mPnk8TsCvWyerYMX0SdiLWbEseOMN+M1vIJVSXU190HVYvhzOOstp3QgxExL24pTk87Bli3MEomy7UD6LFjlz5mVhlJgtCXtREpkMvPmm8yKLskrDNJ2R/MqVEvLi1EnYi5Lbv98J/b17ZcrmbLS1OQG/ZInceBWlI2EvyiaRgG3bnJdEQnU17mYYTqtm1Sro6FBdjahFEvai7GzbGeW/8Yaz/454R1OT06pZvhz8ftXViFomYS8qKpmEffuclwMHnBu89UTToLMTFixwjgOUXryoFAl7oUyhAIcOOcG/d2/tztv3ep3ToebPh3nzZAQv1JCwF64xPPzOqH9w0PllUI103WnPdHU5Ad/T4/TkhVBJwl64kmU52zIMDb3zcuSIswWzm2iac2h3Wxu0tzsvra0S7sJ9JOxF1bBtZ8vlo+E/POzM8kkmnXn+5WSazqrVhgYIhZxAb2tzXmR6pKgGEvaiJliWE/rJpLN9w+T/W5bzy+Lo/23babcc+2IYEAg4oX402BsanD9LoItqJ2EvhBB1QFddgBBCiPKTsBdCiDogYS+EEHVAwl4IIeqAhL0QQtQBCXshhKgDEvZCCFEHJOyFEKIOSNgLIUQdkLAXQog6IGEv6srOnTv57Gc/y6JFi/D7/UQiES644AJuv/12UqmU6vKEKBvZ3knUjQceeIAPfvCD+Hw+Pv7xj7N69Wqy2SxPP/00t9xyC1u3buW73/2u6jKFKAvZCE3Uhd27d7N27Vp6e3t54okn6O7unvD2HTt28MADD3DTTTcpqlCI8pKwF3Xhxhtv5M477+SZZ57h/PPPV12OEBUnYS/qQm9vLz6fj507d6ouRQgl5AatqHmxWIyDBw+yZs0a1aUIoYyEvah5sVgMgHA4rLgSIdSRsBc1LxKJADA2Nqa4EiHUkZ69qAtz5swhEAiwY8cO1aUIoYSM7EVduOaaa9i5cyebN29WXYoQSkjYi7rw5S9/mYaGBj796U/T398/5e07d+7k9ttvV1CZEJUhK2hFXVi8eDE//OEPuf766znttNMmrKB99tlnueeee/jkJz+pukwhykZ69qKuvP3229x22208+uijHDp0CJ/Px9q1a7nhhhv4zGc+g8/nU12iEGUhYS+EEHVAevZCCFEHJOyFEKIOSNgLIUQdkLAXQog6IGEvhBB1QMJeCCHqgIS9EELUAQl7IYSoAxL2QghRByTshRCiDkjYCyFEHZCwF0KIOiBhL4QQdeD/B+rTVMooKQFlAAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "venn3([\n",
    "    set(test_1['smiles'].tolist()),\n",
    "    set(test_2['smiles'].tolist()),\n",
    "    set(test_3['smiles'].tolist()),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_1.to_csv('../../data/hi/kdr/train_1.csv')\n",
    "train_2.to_csv('../../data/hi/kdr/train_2.csv')\n",
    "train_3.to_csv('../../data/hi/kdr/train_3.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_1.to_csv('../../data/hi/kdr/test_1.csv')\n",
    "test_2.to_csv('../../data/hi/kdr/test_2.csv')\n",
    "test_3.to_csv('../../data/hi/kdr/test_3.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "lohi_benchmark",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
