{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from matplotlib_venn import venn3\n",
    "import networkx as nx"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.append('../../code')\n",
    "\n",
    "import min_vertex_k_cut"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>smiles</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Brc1ccc(-[n+]2cc[n+](Cc3ccccc3)cc2)c2cc[nH]c12</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Brc1ccc(CNCCN2CCN(Cc3cc4ccccc4[nH]3)CC2)cc1</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Brc1ccc(N2CCN(Cc3ccccc3)CC2)c2cc[nH]c12</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Brc1ccc(NCCN2CCN(CCc3c[nH]c4ccccc34)CC2)cc1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Brc1ccc(NCCN2CCN(Cc3cc4ccccc4[nH]3)CC2)cc1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6262</th>\n",
       "      <td>c1cnc(N2CCN(CCCOc3ccc(-c4nc5ccccc5o4)cc3)CC2)nc1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6263</th>\n",
       "      <td>c1cnc(N2CCN(CCCSc3nc4ccccc4s3)CC2)nc1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6264</th>\n",
       "      <td>c1cnc(N2CCN(Cc3c[nH]c4ncccc34)CC2)nc1</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6265</th>\n",
       "      <td>c1cncc(CN[C@H]2C3C4CC5C6C4CC3C6C52)c1</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6266</th>\n",
       "      <td>c1nc2c(s1)CCN(CCCCN1CCc3ncsc3CC1)CC2</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>6267 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                smiles  value\n",
       "0       Brc1ccc(-[n+]2cc[n+](Cc3ccccc3)cc2)c2cc[nH]c12   True\n",
       "1          Brc1ccc(CNCCN2CCN(Cc3cc4ccccc4[nH]3)CC2)cc1  False\n",
       "2              Brc1ccc(N2CCN(Cc3ccccc3)CC2)c2cc[nH]c12   True\n",
       "3          Brc1ccc(NCCN2CCN(CCc3c[nH]c4ccccc34)CC2)cc1   True\n",
       "4           Brc1ccc(NCCN2CCN(Cc3cc4ccccc4[nH]3)CC2)cc1   True\n",
       "...                                                ...    ...\n",
       "6262  c1cnc(N2CCN(CCCOc3ccc(-c4nc5ccccc5o4)cc3)CC2)nc1   True\n",
       "6263             c1cnc(N2CCN(CCCSc3nc4ccccc4s3)CC2)nc1   True\n",
       "6264             c1cnc(N2CCN(Cc3c[nH]c4ncccc34)CC2)nc1  False\n",
       "6265             c1cncc(CN[C@H]2C3C4CC5C6C4CC3C6C52)c1  False\n",
       "6266              c1nc2c(s1)CCN(CCCCN1CCc3ncsc3CC1)CC2  False\n",
       "\n",
       "[6267 rows x 2 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "drd2_hi = pd.read_csv('../../data/raw/drd2_hi.csv', index_col=0)\n",
    "drd2_hi"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "smiles = drd2_hi['smiles'].to_list()\n",
    "threshold = 0.4\n",
    "\n",
    "neighborhood_graph = min_vertex_k_cut.get_neighborhood_graph(smiles, threshold)\n",
    "main_component, small_components = min_vertex_k_cut.get_main_component(neighborhood_graph)\n",
    "\n",
    "old_nodes_to_new = dict(zip(main_component.nodes(), range(main_component.number_of_nodes())))\n",
    "new_nodes_to_old = {v: k for k, v in old_nodes_to_new.items()}\n",
    "main_component = nx.relabel_nodes(main_component, old_nodes_to_new)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.9 5160 86.87093023255814\n",
      "0.8 3696 56.81547619047619\n",
      "0.7 1963 34.751910341314314\n",
      "0.6 1128 24.48049645390071\n",
      "0.5 648 17.126543209876544\n",
      "0.4 387 11.534883720930232\n"
     ]
    }
   ],
   "source": [
    "for coarse_threhold in [0.90, 0.80, 0.70, 0.60, 0.50, 0.40]:\n",
    "    coarsed_main_component, _ = min_vertex_k_cut.coarse_graph(main_component, coarse_threhold)\n",
    "    node_degrees = list(dict(coarsed_main_component.degree()).values())\n",
    "    print(coarse_threhold, len(coarsed_main_component), np.mean(node_degrees))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "coarsed_main_component, node_to_cluster = min_vertex_k_cut.coarse_graph(main_component, 0.4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total molecules: 6082\n",
      "Min size of a partition: 1094\n",
      "Welcome to the CBC MILP Solver \n",
      "Version: Trunk\n",
      "Build Date: Oct 24 2021 \n",
      "\n",
      "Starting solution of the Linear programming relaxation problem using Primal Simplex\n",
      "\n",
      "Coin0506I Presolve 12621 (-1161) rows, 1161 (0) columns and 26784 (-2322) elements\n",
      "Clp1000I sum of infeasibilities 7.43375e-07 - average 5.88998e-11, 0 fixed columns\n",
      "Coin0506I Presolve 12621 (0) rows, 1161 (0) columns and 26784 (0) elements\n",
      "Clp0029I End of values pass after 1161 iterations\n",
      "Clp0000I Optimal - objective value 6082\n",
      "Clp0000I Optimal - objective value 6082\n",
      "Clp0000I Optimal - objective value 6082\n",
      "Coin0511I After Postsolve, objective 6082, infeasibilities - dual 0 (0), primal 0 (0)\n",
      "Clp0032I Optimal objective 6082 - 0 iterations time 0.642, Presolve 0.01, Idiot 0.63\n",
      "\n",
      "Starting MIP optimization\n",
      "Cgl0003I 0 fixed, 0 tightened bounds, 10464 strengthened rows, 0 substitutions\n",
      "Cgl0003I 0 fixed, 0 tightened bounds, 1714 strengthened rows, 0 substitutions\n",
      "Cgl0003I 0 fixed, 0 tightened bounds, 53 strengthened rows, 0 substitutions\n",
      "Cgl0004I processed model has 10811 rows, 1161 columns (1161 integer (1161 of which binary)) and 33585 elements\n",
      "Coin3009W Conflict graph built in 0.002 seconds, density: 0.497%\n",
      "Cgl0015I Clique Strengthening extended 0 cliques, 0 were dominated\n",
      "Cbc0045I Nauty: 13928 orbits (9 useful covering 18 variables), 3 generators, group size: 8 - sparse size 101394 - took 0.056423 seconds\n",
      "Cbc0038I Initial state - 1161 integers unsatisfied sum - 278.447\n",
      "Cbc0038I Pass   1: (1.73 seconds) suminf.   87.13622 (284) obj. -4237.52 iterations 3245\n",
      "Cbc0038I Pass   2: (1.81 seconds) suminf.   46.85362 (110) obj. -3548.02 iterations 460\n",
      "Cbc0038I Pass   3: (1.82 seconds) suminf.   40.04460 (97) obj. -3488.52 iterations 61\n",
      "Cbc0038I Pass   4: (1.82 seconds) suminf.   37.89598 (95) obj. -3484.44 iterations 23\n",
      "Cbc0038I Pass   5: (1.83 seconds) suminf.   36.91035 (94) obj. -3475.11 iterations 48\n",
      "Cbc0038I Pass   6: (1.85 seconds) suminf.   33.49012 (82) obj. -3357.47 iterations 97\n",
      "Cbc0038I Pass   7: (1.86 seconds) suminf.   32.78893 (83) obj. -3358 iterations 76\n",
      "Cbc0038I Pass   8: (1.87 seconds) suminf.   30.07705 (73) obj. -3341.38 iterations 82\n",
      "Cbc0038I Pass   9: (1.88 seconds) suminf.   30.00715 (73) obj. -3341.74 iterations 34\n",
      "Cbc0038I Pass  10: (1.89 seconds) suminf.   29.89931 (77) obj. -3345.81 iterations 69\n",
      "Cbc0038I Pass  11: (1.90 seconds) suminf.   30.00715 (73) obj. -3341.74 iterations 61\n",
      "Cbc0038I Pass  12: (1.99 seconds) suminf.   58.39230 (167) obj. -3282 iterations 533\n",
      "Cbc0038I Pass  13: (2.05 seconds) suminf.   28.39067 (74) obj. -3282 iterations 310\n",
      "Cbc0038I Pass  14: (2.05 seconds) suminf.   27.25817 (74) obj. -3282 iterations 28\n",
      "Cbc0038I Pass  15: (2.06 seconds) suminf.   25.16452 (78) obj. -3282 iterations 54\n",
      "Cbc0038I Pass  16: (2.07 seconds) suminf.   24.51957 (66) obj. -3282 iterations 30\n",
      "Cbc0038I Pass  17: (2.08 seconds) suminf.   24.50153 (69) obj. -3282 iterations 12\n",
      "Cbc0038I Pass  18: (2.09 seconds) suminf.   23.21391 (69) obj. -3282 iterations 61\n",
      "Cbc0038I Pass  19: (2.10 seconds) suminf.   22.84212 (63) obj. -3282 iterations 30\n",
      "Cbc0038I Pass  20: (2.11 seconds) suminf.   22.71025 (61) obj. -3282 iterations 24\n",
      "Cbc0038I Pass  21: (2.11 seconds) suminf.   22.03717 (65) obj. -3282 iterations 47\n",
      "Cbc0038I Pass  22: (2.12 seconds) suminf.   21.93805 (62) obj. -3282 iterations 21\n",
      "Cbc0038I Pass  23: (2.13 seconds) suminf.   18.05764 (55) obj. -3282 iterations 67\n",
      "Cbc0038I Pass  24: (2.14 seconds) suminf.   17.40644 (48) obj. -3282 iterations 24\n",
      "Cbc0038I Pass  25: (2.15 seconds) suminf.   14.03074 (44) obj. -3282 iterations 73\n",
      "Cbc0038I Pass  26: (2.16 seconds) suminf.   13.67773 (43) obj. -3282 iterations 33\n",
      "Cbc0038I Pass  27: (2.17 seconds) suminf.   13.89980 (50) obj. -3282 iterations 46\n",
      "Cbc0038I Pass  28: (2.18 seconds) suminf.   13.50581 (40) obj. -3282 iterations 35\n",
      "Cbc0038I Pass  29: (2.19 seconds) suminf.   13.22794 (47) obj. -3282 iterations 47\n",
      "Cbc0038I Pass  30: (2.20 seconds) suminf.   12.99241 (51) obj. -3282 iterations 28\n",
      "Cbc0038I No solution found this major pass\n",
      "Cbc0038I Before mini branch and bound, 0 integers at bound fixed and 0 continuous\n",
      "Cbc0038I Full problem 10811 rows 1161 columns, reduced to 10811 rows 1161 columns - too large\n",
      "Cbc0038I Mini branch and bound did not improve solution (2.23 seconds)\n",
      "Cbc0038I After 2.75 seconds - Feasibility pump exiting - took 1.89 seconds\n",
      "Cbc0013I At root node, 0 cuts changed objective from -6082 to -6082 in 1 passes\n",
      "Cbc0014I Cut generator 0 (Probing) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.028 seconds - new frequency is -100\n",
      "Cbc0014I Cut generator 1 (Gomory) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.046 seconds - new frequency is -100\n",
      "Cbc0014I Cut generator 2 (Knapsack) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.004 seconds - new frequency is -100\n",
      "Cbc0014I Cut generator 3 (Clique) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.015 seconds - new frequency is -100\n",
      "Cbc0014I Cut generator 4 (OddWheel) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.180 seconds - new frequency is -100\n",
      "Cbc0014I Cut generator 5 (MixedIntegerRounding2) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.007 seconds - new frequency is -100\n",
      "Cbc0014I Cut generator 6 (FlowCover) - 0 row cuts average 0.0 elements, 0 column cuts (0 active)  in 0.000 seconds - new frequency is -100\n",
      "Cbc0010I After 0 nodes, 1 on tree, 1e+50 best solution, best possible -6082 (6.01 seconds)\n",
      "Cbc0010I After 2 nodes, 1 on tree, 1e+50 best solution, best possible -6081.6401 (7.21 seconds)\n",
      "Cbc0010I After 3 nodes, 2 on tree, 1e+50 best solution, best possible -6081.6401 (8.53 seconds)\n",
      "Cbc0010I After 4 nodes, 2 on tree, 1e+50 best solution, best possible -6081.6401 (11.96 seconds)\n",
      "Cbc0010I After 5 nodes, 2 on tree, 1e+50 best solution, best possible -6081.6401 (13.04 seconds)\n",
      "Cbc0010I After 7 nodes, 1 on tree, 1e+50 best solution, best possible -6081.6401 (14.22 seconds)\n",
      "Cbc0010I After 8 nodes, 2 on tree, 1e+50 best solution, best possible -6081.6401 (15.12 seconds)\n",
      "Cbc0010I After 10 nodes, 1 on tree, 1e+50 best solution, best possible -6081.28 (16.72 seconds)\n",
      "Cbc0010I After 12 nodes, 2 on tree, 1e+50 best solution, best possible -6081.28 (17.91 seconds)\n",
      "Cbc0010I After 13 nodes, 2 on tree, 1e+50 best solution, best possible -6081.28 (18.69 seconds)\n",
      "Cbc0010I After 16 nodes, 1 on tree, 1e+50 best solution, best possible -6081.28 (20.62 seconds)\n",
      "Cbc0010I After 19 nodes, 2 on tree, 1e+50 best solution, best possible -6081.28 (21.54 seconds)\n",
      "Cbc0010I After 22 nodes, 1 on tree, 1e+50 best solution, best possible -6081.28 (22.83 seconds)\n",
      "Cbc0010I After 25 nodes, 2 on tree, 1e+50 best solution, best possible -6081.28 (23.89 seconds)\n",
      "Cbc0010I After 27 nodes, 2 on tree, 1e+50 best solution, best possible -6081.28 (25.65 seconds)\n",
      "Cbc0010I After 30 nodes, 4 on tree, 1e+50 best solution, best possible -6081.28 (26.76 seconds)\n",
      "Cbc0010I After 33 nodes, 6 on tree, 1e+50 best solution, best possible -6080.9197 (27.89 seconds)\n",
      "Cbc0010I After 36 nodes, 9 on tree, 1e+50 best solution, best possible -6080.9197 (28.60 seconds)\n",
      "Cbc0010I After 39 nodes, 12 on tree, 1e+50 best solution, best possible -6080.9197 (29.53 seconds)\n",
      "Cbc0010I After 44 nodes, 16 on tree, 1e+50 best solution, best possible -6080.9197 (30.31 seconds)\n",
      "Cbc0010I After 47 nodes, 18 on tree, 1e+50 best solution, best possible -6080.9197 (31.20 seconds)\n",
      "Cbc0010I After 51 nodes, 20 on tree, 1e+50 best solution, best possible -6080.9197 (32.14 seconds)\n",
      "Cbc0010I After 54 nodes, 21 on tree, 1e+50 best solution, best possible -6080.9197 (33.00 seconds)\n",
      "Cbc0010I After 62 nodes, 27 on tree, 1e+50 best solution, best possible -6080.9197 (34.00 seconds)\n",
      "Cbc0010I After 68 nodes, 32 on tree, 1e+50 best solution, best possible -6080.9197 (34.78 seconds)\n",
      "Cbc0010I After 70 nodes, 34 on tree, 1e+50 best solution, best possible -6080.9197 (35.69 seconds)\n",
      "Cbc0010I After 74 nodes, 37 on tree, 1e+50 best solution, best possible -6080.9197 (36.81 seconds)\n",
      "Cbc0010I After 77 nodes, 39 on tree, 1e+50 best solution, best possible -6080.9197 (37.60 seconds)\n",
      "Cbc0010I After 81 nodes, 42 on tree, 1e+50 best solution, best possible -6080.9197 (38.39 seconds)\n",
      "Cbc0010I After 84 nodes, 43 on tree, 1e+50 best solution, best possible -6080.9197 (39.11 seconds)\n",
      "Cbc0010I After 88 nodes, 46 on tree, 1e+50 best solution, best possible -6080.9197 (39.98 seconds)\n",
      "Cbc0010I After 95 nodes, 50 on tree, 1e+50 best solution, best possible -6080.9197 (40.73 seconds)\n",
      "Cbc0010I After 101 nodes, 56 on tree, 1e+50 best solution, best possible -6080.9197 (41.48 seconds)\n",
      "Cbc0010I After 107 nodes, 60 on tree, 1e+50 best solution, best possible -6080.9197 (42.37 seconds)\n",
      "Cbc0010I After 115 nodes, 66 on tree, 1e+50 best solution, best possible -6080.9197 (43.13 seconds)\n",
      "Cbc0010I After 118 nodes, 68 on tree, 1e+50 best solution, best possible -6080.9197 (43.93 seconds)\n",
      "Cbc0010I After 125 nodes, 73 on tree, 1e+50 best solution, best possible -6080.9197 (44.77 seconds)\n",
      "Cbc0010I After 134 nodes, 77 on tree, 1e+50 best solution, best possible -6080.9197 (45.63 seconds)\n",
      "Cbc0010I After 139 nodes, 81 on tree, 1e+50 best solution, best possible -6080.9197 (46.53 seconds)\n",
      "Cbc0010I After 145 nodes, 85 on tree, 1e+50 best solution, best possible -6080.9197 (47.34 seconds)\n",
      "Cbc0010I After 155 nodes, 88 on tree, 1e+50 best solution, best possible -6080.9197 (48.06 seconds)\n",
      "Cbc0010I After 160 nodes, 91 on tree, 1e+50 best solution, best possible -6080.9197 (48.84 seconds)\n",
      "Cbc0010I After 168 nodes, 98 on tree, 1e+50 best solution, best possible -6080.9197 (49.64 seconds)\n",
      "Cbc0010I After 176 nodes, 104 on tree, 1e+50 best solution, best possible -6080.9197 (50.59 seconds)\n",
      "Cbc0010I After 186 nodes, 109 on tree, 1e+50 best solution, best possible -6080.9197 (51.33 seconds)\n",
      "Cbc0010I After 193 nodes, 115 on tree, 1e+50 best solution, best possible -6080.9197 (52.18 seconds)\n",
      "Cbc0010I After 206 nodes, 123 on tree, 1e+50 best solution, best possible -6080.9197 (53.06 seconds)\n",
      "Cbc0010I After 217 nodes, 132 on tree, 1e+50 best solution, best possible -6080.9197 (53.96 seconds)\n",
      "Cbc0010I After 226 nodes, 136 on tree, 1e+50 best solution, best possible -6080.9197 (54.74 seconds)\n",
      "Cbc0010I After 239 nodes, 144 on tree, 1e+50 best solution, best possible -6080.9197 (55.47 seconds)\n",
      "Cbc0010I After 251 nodes, 149 on tree, 1e+50 best solution, best possible -6080.9197 (56.27 seconds)\n",
      "Cbc0010I After 268 nodes, 155 on tree, 1e+50 best solution, best possible -6080.9197 (57.12 seconds)\n",
      "Cbc0010I After 289 nodes, 168 on tree, 1e+50 best solution, best possible -6080.9197 (57.95 seconds)\n",
      "Cbc0010I After 309 nodes, 174 on tree, 1e+50 best solution, best possible -6080.9197 (58.67 seconds)\n",
      "Cbc0010I After 328 nodes, 173 on tree, 1e+50 best solution, best possible -6080.9197 (59.46 seconds)\n",
      "Cbc0010I After 351 nodes, 181 on tree, 1e+50 best solution, best possible -6080.9197 (60.19 seconds)\n",
      "Cbc0004I Integer solution of -3284 found after 156839 iterations and 377 nodes (60.90 seconds)\n",
      "Cbc0012I Integer solution of -3284 found by heuristic after 157558 iterations and 378 nodes (60.90 seconds)\n",
      "Cbc0010I After 379 nodes, 197 on tree, -3284 best solution, best possible -6080.9197 (60.90 seconds)\n",
      "Cbc0004I Integer solution of -3284 found after 154323 iterations and 346 nodes (60.97 seconds)\n",
      "Cbc0012I Integer solution of -3390 found by heuristic after 157640 iterations and 380 nodes (61.91 seconds)\n",
      "Cbc0030I Thread 0 used 30 times,  waiting to start 0.8841145,  149 locks, 0.0011029243 locked, 3.2901764e-05 waiting for locks\n",
      "Cbc0030I Thread 1 used 29 times,  waiting to start 1.3851204,  142 locks, 0.001131773 locked, 3.2901764e-05 waiting for locks\n",
      "Cbc0030I Thread 2 used 24 times,  waiting to start 3.2346435,  119 locks, 0.0010251999 locked, 3.0994415e-05 waiting for locks\n",
      "Cbc0030I Thread 3 used 25 times,  waiting to start 6.8744073,  123 locks, 0.00096821785 locked, 3.0994415e-05 waiting for locks\n",
      "Cbc0030I Thread 4 used 26 times,  waiting to start 8.0865619,  129 locks, 0.0010609627 locked, 0.00019717216 waiting for locks\n",
      "Cbc0030I Thread 5 used 22 times,  waiting to start 9.1470482,  112 locks, 0.0051388741 locked, 2.5987625e-05 waiting for locks\n",
      "Cbc0030I Thread 6 used 29 times,  waiting to start 10.768192,  142 locks, 0.0012004375 locked, 3.8862228e-05 waiting for locks\n",
      "Cbc0030I Thread 7 used 29 times,  waiting to start 12.052212,  144 locks, 0.001139164 locked, 3.7908554e-05 waiting for locks\n",
      "Cbc0030I Thread 8 used 23 times,  waiting to start 12.688021,  111 locks, 0.0012397766 locked, 2.9325485e-05 waiting for locks\n",
      "Cbc0030I Thread 9 used 22 times,  waiting to start 13.536081,  109 locks, 0.00085425377 locked, 2.5749207e-05 waiting for locks\n",
      "Cbc0030I Thread 10 used 23 times,  waiting to start 13.976015,  113 locks, 0.0037610531 locked, 3.1471252e-05 waiting for locks\n",
      "Cbc0030I Thread 11 used 18 times,  waiting to start 15.62985,  87 locks, 0.00079250336 locked, 2.2649765e-05 waiting for locks\n",
      "Cbc0030I Thread 12 used 23 times,  waiting to start 15.925876,  114 locks, 0.00095057487 locked, 3.027916e-05 waiting for locks\n",
      "Cbc0030I Thread 13 used 28 times,  waiting to start 16.534795,  138 locks, 0.0012464523 locked, 3.3140182e-05 waiting for locks\n",
      "Cbc0030I Thread 14 used 18 times,  waiting to start 16.473678,  89 locks, 0.00069880486 locked, 1.7166138e-05 waiting for locks\n",
      "Cbc0030I Thread 15 used 26 times,  waiting to start 16.781872,  128 locks, 0.0010666847 locked, 2.9802322e-05 waiting for locks\n",
      "Cbc0030I Main thread 54.80454 waiting for threads,  862 locks, 0.00091266632 locked, 4.3153763e-05 waiting for locks\n",
      "Cbc0011I Exiting as integer gap of 2690.9197 less than 1e-10 or 50%\n",
      "Cbc0045I Orbital branching succeeded 37 times - average extra   0.027, fixing (0,   0.000)\n",
      "Cbc0001I Search completed - best objective -3390, took 157640 iterations and 380 nodes (61.92 seconds)\n",
      "Cbc0032I Strong branching done 7196 times (527182 iterations), fathomed 16 nodes and fixed 36 variables\n",
      "Cbc0035I Maximum depth 30, 0 variables fixed on reduced cost\n",
      "Total time (CPU seconds):       701.36   (Wallclock seconds):       62.43\n",
      "\n"
     ]
    }
   ],
   "source": [
    "model = min_vertex_k_cut.trisect_connected_graph(coarsed_main_component, part_min_frac=0.18, emphasis=1, max_mip_gap=0.5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<OptimizationStatus.OPTIMAL: 0>"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.status"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[2692 1098 1194 1098]\n"
     ]
    }
   ],
   "source": [
    "split = min_vertex_k_cut.process_trisect_results(model, coarsed_main_component, main_component, node_to_cluster)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "first_idx = []\n",
    "second_idx = []\n",
    "third_idx = []\n",
    "\n",
    "for S_idx, partition in enumerate(split):\n",
    "    G_idx = new_nodes_to_old[S_idx]\n",
    "    if partition == 0:\n",
    "        first_idx.append(G_idx)\n",
    "    if partition == 1:\n",
    "        second_idx.append(G_idx)\n",
    "    if partition == 2:\n",
    "        third_idx.append(G_idx)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "for component in small_components:\n",
    "    i = np.argmin([len(first_idx), len(second_idx), len(third_idx)])\n",
    "    if i == 0:\n",
    "        first_idx.extend(component)\n",
    "    if i == 1:\n",
    "        second_idx.extend(component)\n",
    "    if i == 2:\n",
    "        third_idx.extend(component)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[1191, 1194, 1190]"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[len(first_idx), len(second_idx), len(third_idx)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [],
   "source": [
    "part_first = drd2_hi.iloc[first_idx]\n",
    "part_second = drd2_hi.iloc[second_idx]\n",
    "part_third = drd2_hi.iloc[third_idx]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib_venn._common.VennDiagram at 0x7f65a3cdd300>"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAgMAAADVCAYAAADKI/NMAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAqF0lEQVR4nO3deXBc1Z0v8G+3Wt1Sa99sWdZuIVuSgw3ejW2sWEAMhkzxIDaPmQyuhOdHhUmACszkDfUySQ1TM8kkQ4bxFJVKZkwFBSbwnDwIycMGGYQX4g1jvEiyZGtfrNaubkmtVvf74yDbMrLV+zn33u+nqss4Lal/cs6993vPdk0+n88HIiIiMiyz7AKIiIhILoYBIiIig2MYICIiMjiGASIiIoNjGCAiIjI4hgEiIiKDYxggIiIyOIYBIiIig2MYICIiMjiGASIiIoNjGCAiIjI4hgEiIiKDYxggIiIyOIYBIiIig2MYICIiMjiGASIiIoNjGCAiIjI4hgEiIiKDYxggIiIyOIYBIiIig2MYICIiMjiGASIiIoNjGCAiIjI4hgEiIiKDYxggIiIyOIYBIiIig2MYICIiMjiGASIiIoNjGCAiIjI4hgEiIiKDYxggIiIyOIvsAgzJ5wOGhgCXS7yczqv/7XIBY2PA1BTg9YoXAJjNgMkExMQANhuQkADY7TNfCQlAcjJg4f+tRjfuGUf/WD+cbidck64ZL+ekE+OecUx5p+CDD16faGNmkxkmmBBjjkGcJQ72WPuMV0JsAuyxdqTFp8Eea5f8G5JsXi8wMnLj09j4+NVT2LWnMbNZnMbi4794CrPbgcRE8aLoMvl8Pp/sInTN5wMGBgCHQ7x6e4G+PsDjicznmc1AaiqQlQVkZoo/09MZEHRs3DOOXmcvHC4Hel3iz1H3aEQ/0x5rR5Y9C5n2TGQliD8ZEPTL6wUGB8Xpq7dXnMr6+sQ9SyRYreL0NX0Ky8wEUlIi81kkMAxEQn8/0NwMtLeLoyZSF35/TQeEhQuBggJgwQLRy0Ca5PF60DHcgZahFrQPt0f8wu8ve6wducm5KEgpQF5KHixmBlAt6+0FWlrEaSySF35/TQeEvDxxGktNlVuP3jAMhIPXC3R1iSOnpUX0nanMZhNHVGEhkJsrjjJS2tjkGFqGWtAy2IKOkQ54vJID5hxiTDHIScpBQWoBClIKkGBNkF0SzWFqCujouHoac7lkV3RzKSkiFBQUANnZvL8JFcNAKLq7gfPnxZHjdsuuJjhmM5CTAyxZIsKBmXNKVTHlnULTQBPqHHXoHu2WXU5IsuxZWJK5BLdk3MIeA4X4fOLOv64OaGuT34kZrLg4EQrKyoB582RXo00MA4GanAQuXADOnRPDAXpit4tQUFYmJiOSFMMTwzjfex71ffUY94zLLiesrDFWlGaUojyrHKlxqbLLMazxcaC+XtzLDA/Lria8MjOB8nKgpIRTpQLBMOCvgQERAC5c0G4vgL/MZhGzy8vFPAOKOJ/Ph7bhNpy9fBbtw+3wQf+HZU5SDsqzylGYWgiziT1S0XD5MnD2LHDxovw5AJFmswGlpeI0xsmHc2MYmMvAAHDsmJgQaESZmcDq1WJuAUVEy2ALjnUeQ/+Yznqa/JRiS8HKnJVYlL5Idim61d0NHD0q/jSi4mJg1SqGgpthGLiR0VHg+HHRE8B/IjGvYPVqDsiFUfdoN452HNX8fIBwybRnYvXC1chNZvAMl/5+cS/T0iK7EvnMZtFTsHKlGBGlmRgGrjc+DnzyiRgS0Hs/WjCKikTE5rqeoPWP9eNox1G0DrXKLkVJOUk5WLNwDbISsmSXolm8l7kxiwVYuhRYvpwLqa7FMDDN5wM++ww4eVL/cwJCZTKJSYarV/NoCoB7yo2P2z9GvaPeEHMCQlWSXoL1eesRZ4mTXYpmeDzAiRPAmTO8l5mLzQasWCGCATEMCIODwIcfAj09sivRlsREYNMmzifwQ9tQG2pbauGcdMouRVPiLHHYkL8BxWnFsktRXk8P8MEHYqdz8l92NrB5s9jJ3ciMHQamewOOHWOMDsWSJcDatewlmIV7yo0jbUdQ31cvuxRNK04rxob8DewlmIXHI4YEPvuMQwLBslhER6eRewmMGwbYGxBe7CX4AvYGhBd7Cb6IvQHhZeReAmOGgfPngcOH2RsQCeXlwPr1ht7J0Ovz4nDbYZzrPSe7FF26Jf0WbCzYaOidDH0+0Rtw6hR7A8LNYhGnsCVLZFcSXcYKA16vCAHneJKOqAULgLvuEnuEGsy4Zxz7m/aja7RLdim6lmXPwt2L7jbkMw/cbqCmBmjlYpSIqqgA1q0zzn2NccLA+Djw3ntAZ6fsSowhMRG45x4gI0N2JVHTP9aPdxvfxYhb8QdV6YQ91o67F92NeQnG2ftiaAh4910xykmRt3AhUFUlVh7onTHCQH+/OIJUf5qg3lgsQGWl2JtA5y4NXMKB5gPKP01Qb2JMMdhYsBGlGaWyS4m49nbg/feBiQnZlRhLcrK4r0lLk11JZOk/DDQ3AwcOiAcMkRwrVoiXTp3oPIETXSdkl2Fot86/FWsWroFJp8+xPXMGOHKE8wNkiY0Fvvxl8cgWvdJ3GKivB2preQSpoKwM2LhRdhVhd7D1ICcKKqIkvQSVhZW6CwRHj4qJgiSXyQTceafY0liP9BsGzp0DDh6UXQVdq7RUHE06OFn7fD7UttRy/wDFFKUWYUvxFt08BfHwYdErQOrYuFHc2+iNPsPAmTPiKCL1lJSIeQQaDgQ+nw8ftnyIhr4G2aXQLApSCnDXors0HwgOHuTCJ1XdcYdYbaAn2j5aZnPuHIOAyhobxWZPGvZR60cMAgprGWpBzaUaaPk+hyug1XboEFBXJ7uK8NJXGGho4NCAFjQ0AB99JLuKoBxqPYQ6h87OAjp0ceAiDjQf0GQgOHqUQwNa8NFH4qmQeqGfMNDervk7TkM5f148IVJDPu3+FGd7z8oug/zU2N+IY53HZJcRkLNnOVlQK3w+sRV0R4fsSsJDH2FgaEhsKKTBuwBDO35cLP3UgNahVhztOCq7DArQqe5TaOxvlF2GXzo6xPJB0g6fT1x6hodlVxI67YcBt1tsKOR2y66EglFTIzaFUtjg+KAYgwbDphZ92Pwhep29ssu4qeFhcVHxemVXQoGamBCXIK1vZaPtMODziS25uDendnk84kgaH5ddyawmPBN4t/FduKcYNrVqyjeFfU374Jp0yS5lVpOT4hDgzoLaNTAgLkVa7pzWdhj405+AtjbZVVCoRkaA/fuVuy3y+Xx4/9L7GJrg82G1zjnpxL6mfZjyqvWk0un7mYEB2ZVQqFpbgWPamqIyg3bDQFMTcPq07CooXLq6lBswPdpxFO3D7bLLoDC57LyMQ22HZJcxw4kTfPqgnpw6BVy8KLuK4GgzDLhcml2aRjdx9qxYFaKA7tFunO5h2NSbOkcdWofUuPpevgx88onsKijcPvpIXKK0RpthoLaWEwb1qrZW+kwcj9eDD5s/5IRBnaptqZU+B2RqSixL0/IYM81uYkKb291oLww0NLBfTc9GR4GPP5ZawrGOY5wnoGOuSRcOt8ndpfT4cc571rPmZrHZqpZoKwy4XNxq2AjOn5c2XNA92o0zl7n9m9419DVIGy64fJnTnYzg0CFtDRdoKwxweMA4JAwXeLwefND8AYcHDELGcAGHB4xjYkJbU9u0EwYaGzk8YCSjo2LpaBSd6DyB4QkdbCVGfnFNuvBxe3SHpE6e5PCAkbS0iIVvWqCNMOD1ansBJwWnrk5sNR0Fo+5RDg8YUL2jHgNj0Vnk73QCn30WlY8ihRw9qtwWKrPSRhg4d05sTEPGEsUQeKLzBKZ8am1IQ5Hngy9qDzM6cUJsuEnGMjKijcdRqx8GJic193Q7CqOLF4HeyO4rPzA2gIa+hoh+BqmrebAZPaM9Ef2MwUGgvj6iH0EK++QT6Sum56R+GDh9Wtl96ylKjkb2aYHHOo9x0qDBRfqJlMePc9KgkY2NqT9EpHYYGBvjGhwSz3aN0EPDe0Z70DzYHJGfTdrRNdqFtqHIPOekt1e7W9RS+Hz6qdr3tWqHAS30rVB0RKh3IFrjxaS+SPUORLhjizRiclLt7afVDQNut5hNTgSI26uurrD+SIfLgc6RzrD+TNKuvrE+dAyHtweqry9inVqkQXV16t7fqhsGGho49ZZmOns2rD/uXK8GpvhSVIW7TWhhFjlFz+SkuLSpSN0wwKOIrtfcHLb9Pd1TbjT2a2zzcIq4lqEWON3OsPwstxu4cCEsP4p0RNVLm5phoLOT23TRF3m9YRs6qnfUw+NlzxPN5PV5cd5xPiw/i52bNJuBAXGJU42aYUDV6ETy1dWFZY0WhwjoRuocdfD6Qt8yjqcxuhEV24Z6YcDlEt3BRLMZHRUbfoegY7iDjyimG3JNukJebsrOTbqZMI54ho16YaChQRsbOZM8IQ4V1PdxKzi6uTpHaG2MC6HoZrxe9SYSqhcG2CtAc+noCHow1uvzSnuOPWlH50gnJqeCWwPm9fIBqzQ31S51aoWBsTHg8mXZVZDqpqaA9vagvrVrpCvqz7An7fH6vGgbDm5Hwu5usZKA6GZ6e8UlTxVqhYEQx4LJQIKM1S1DbGPkn5bB4NqKand8pCafT61LHsMAaVNra1CrCoI9wZPxtA61whdEG+MQAflLpbaiThjweLhvJ/lvfBzoCeyxs/1j/Rhxj0SoINKbiakJdI92B/Q9AwPA8HCECiLdaW8Xo54qUCcMhDApjAwqwJ4k9gpQoAIdVmLnJgVCpXtgtcIAUSACbDMdI2xjFJhAH1zE0xgFSpU2o04YcDhkV0Ba098f0J4UDhfbGAVmYHwAU17/+3F7eyNYDOmSKm1GjTDg8zEMUOC8XhEI/DA8McwlhRQwr8+L/jE/29gwlxRS4Pr6wrLDesjUCAODg5wvQMHxM1azV4CC1evys42xiVEQJieBIQV2R1cjDPAoomD52XZ6nYr0xZHm+BskVenuJe1Roe2oEQZU+JcgbfKz7fh7d0d0PX+DJE9jFCwV7ofVCAMq/EuQNvk5iZDDBBQsfycR8jRGwVIhSKoRBvisTwqW1zvnLi+uSRcnD1LQvD4vhifmaGMuTh6k4KlwCZQfBrxesZscUbDmeDC4a1KxB4eT5szVhlR7Nj1py/h4QKukI0J+GOBRRKFiGKAIYxigSJPdhuSHAadTdgWkdQwDFGHOyZufp2SfyEn7ZLch+WFA9r8Aad8cgZJhgEI1VxviPQ2FSval0CL34yH/XyAKahsa8ON9+3CitRVdQ0P47RNP4M+WL7/y/t6TJ/FybS1OtLai3+nEJ88/j+V5eTN+RlNvL7775ps42NiICY8HX6mowEs7dmB+cvKVr3nhD3/AO599hlNtbbBaLBh88cUo/YaSzdGGnG79n6kbTjZg36/2ofV8K4YcQ3jin5/A8s3Lr7x/suYkav9PLVrrWuEccuL56ueRt3hmG+tt78WbL76JxlON8Ex6ULGuAjue3YHkjGRcb9I9iX987B/R3tA+68/SGw4TAA0Ntdi378dobT2BoaEuPPHEb7F8+Z9def/kyb2orX0Zra0n4HT24/nnP0Fe3vIZP6O3twlvvvldNDYehMczgYqKr2DHjpeQnDz/ytc4nf14/fW/wunTb8NkMuP22/8bvva1nyEuLjFKv6kcsgMlewaiwOl2Y1luLnY/8sgN399QUoJ/evDB2d+fmMDdL74IE4CaZ57Boeeeg9vjwf27d8N7zawTt8eDh1eswBN33hmJX0NdHCaAe8yN3Fty8chfz97G3GNulCwvwYN/NXsbmxibwIvfehEwAc+8/Aye++Vz8Ex6sPvpmW1s2t5/3YvUzNQw/gZqYxgA3G4ncnOX4ZFHdt/w/ZKSDXjwwX+a9f2JCSdefPFuACY880wNnnvuEDweN3bvvn9GG/vlLx9FZ+dZPPXUfjz55O9x4UItXn31f0TiV1KK7DYkv2fAACsJti5diq1Ll97w/b9YuxYA0HyDhcqHmprQ3NeHT55/Hsnx8QCAV3buRNrTT6Omvh5VZWUAgB888AAAYM/hw+EsX31ztKGJqYkoFSLP0juWYukdN25ja+8TbczROXsba/q0CX1dfXi++nnEJ4o2tvMHO/F05dOoP1aPsjVlV772zKEzOPfxOez60S6cOXwmjL+FusY9c7Qx/TcxLF26FUuXbr3h+2vX/gUAwOFonvX9pqZD6OtrxvPPf4L4eNHbtHPnK3j66TTU19egrKwKXV3ncfbs/8P3vncMhYUrAQDbt7+Ef/u3e/HQQ/+M1NSc8P5SCpF9KZTfMyB7PYUGTExOwmQywWa5mt3iLBaYTSYcbGyUWJki5mhDgTx1zqgm3aKNWaxX25jFaoHJbELjqattbLhvGL964VfY+cOdsMZZZZQqhdc3RxtjE5vT5OSEaGMW25X/zWKJg8lkRmPjQQDAxYtHYLenXgkCAFBWVgWTyYxLl/4U9ZqjSfalkGFAA9YWFyPBasVf790Ll9sN58QEvvvmm5jyetGlwhMuZJvjkV8+KPBIMMUVf6kY1jgr9r60F+5xNybGJvDmi2/CO+XFkEO0MZ/Phz0/2INND25CYXmh3IKjbK4woMJT51RXXLwWVmsC9u79a7jdLkxMOPHmm9+F1zuFoaEuAMDQUDeSkubN+L6YGAsSEtIxPNwto+yokd2G5IcB2f8CGpCVlIQ3du3C26dPI/Hb30bKU09hcGwMt+fnw2wyyS5PvjkC5VwncgKS0pKw65924XTtaXx747fx1OanMDYyhvwl+TCZRRs78F8HMO4cx9adN+4q1ivfHOcp3tPMLSkpC7t2vYHTp9/Gt7+diKeeSsHY2CDy82+HyST/UiSb7DYkf84A+eXu8nI0vfACHKOjsJjNSLXbkf3ssyjOzJRdGulE+dpyvPB/X8Do4CjMMWbYk+x49p5nkblQtLG6Y3W4+NlFfGv9t2Z83z98/R+w+iursfMHO2WUTRpSXn43XnihCaOjDpjNFtjtqXj22WxkZhYDAFJSsjEycnnG90xNeeB09iM5OVtGyYYhPwyYmQgDkZkoltfU1NXh8sgIHli2THJFCpijDZl51xGQxFTRxuqO1WGkfwTLNok2tuPZHfjqE1+98nVDjiH87Mmf4fF/eBxFS4uk1Botc7UhnsYCk5j4ecCsq8HIyGUsWyYmPxcXr4PLNYiWlhMoKFgBAKivr4HP50VR0Rpp9UaD7DbEMBAFo+PjaLzmsVSXHA6camtDekIC8tPT0e90orW/H52fP62ivluMjWUnJyM7JQUA8J+HDqFswQJkJSXhSFMTvvOb3+DpLVuwOPtqWm7t77/ys6a8XpxqawMAlGRlITEuLkq/rQQMAxh3jaO37Wobc3Q40FbfhoSUBKRnp8M55ER/dz8GewcBAN0too0lZyQjJVO0sUNvHcKCogVISktC0+km/OYnv8GW/74F2YWijaVnp8/4TJtdTATLys1C2vy0SP+KUjEMAOPjo+jtvTqZ1OG4hLa2U0hISEd6ej6czn7097dicLATANDdXQ8ASE7ORkqKaEOHDv0nFiwoQ1JSFpqajuA3v/kOtmx5GtnZiwEACxaUoaLiK/jVrx7Ho4++jKmpSbz22pNYuXKHrlcSAPLbEMNAFBxvaUHlT3965e/PvPEGAOAv163Dnscew1uffoqdr7xy5f0dv/gFAOD727bh7+6/HwBQ39OD7/3ud+h3OlGYkYG/3boVT1dVzfic//3WW3jlyJErf7/t7/8eAHDgmWewefHiyPxyKoiJufnbppu/rwct51rw0/95tY298S+ija3btg6P/d1j+LT2U7zyg6tt7Bf/S7SxbY9vw/27RBvraenB73b/Ds4hJzJyMrB151ZUPTqzjRlVjHmONqb/JoaWluP46U8rr/z9jTeeAQCsW/eXeOyxPfj007fwyitXh4p+8YsdAIBt276P++//OwBAT089fve778Hp7EdGRiG2bv1bVFU9PeNzvvGNarz22pP4l3/ZcmXToe3b/zXCv518stuQyTfXzJhIO3kSOH5cagmkcbm5wL333vDt9y6+h4sDF6NYEOnNwqSFuK/0vhu+/957wEU2MQrBypXA7bfL+3z5t+V2u+wKSOvmaEP2WLYxCs1cbYinMQqV7DbEMEDaxzBAEcYwQJEmuw0xDJD2MQxQhDEMUKQlJMj9fIYB0r452lBCrOSjjDQvwXrzNsTTGIVKdhuSHwbi4wHuokehmCNSs2eAQjVXG5J9V0faZjaLS6HUGuR+PEQQkB2JSNvmOBPPdVdHNJe5epcYBigUKlwC5YcBAMjIkF0BaZXVCny+K+MNvyTGikTrzb+G6EasMVYk2ZJu/jVzN0OiG0pPn/trIk2NMMD99SlYfradTDvbGAUnI96/mxWexihYWVmyK2AYIK3z8yjKsitwtJEmZSX42cbYxChIKlwC1QgDPIooWOwZoAjzt+2ocEInbVLhEqhGGEhIkD+VkrTJ354BP+/uiK7nbxhQ4YRO2mO3cwLhTDySKFBWK5Cc7NeXxlniOImQAhZrjkVqXKpfXxsXx0mEFDhVepQYBki7AmwznDdAgQq0R4mnMQqUKm1GnTCQlye7AtKaANtMXgrbGAUmLznANsYmRgFSpc2oEwbmzeO8AQpMYWFAX56fkh+ZOki3ClILAvv6wL6cDM5uF5c+FagTBgAeSeS/1FS/5wtMs8faMS9BkSOPlJdiS/F7vsC0+Hh1Tu6kvnyF7k8YBkibgmwrBSlsY+SfQHsFrnwfmxj5SaW2olYYWLgQsFhkV0FaEGwYCPIET8YTbHBU6QRP6rJYxCVPFWqFAdX+dUhNcXHA/PlBfWt6fDqSrDffZ57IFmNDdmJ2UN+bnh7wCBYZkGr3vmqFAQAoKpJdAamusDCkx14XpbGN0c0VpBbAFEobYxOjOajWRtQLA8XFgM0muwpSWXl5SN9ellkWpkJIr8qzQmxjbGJ0EzYbsGiR7CpmUi8MWCxAaansKkhV8+aFvGVXSlwKFiZxOIpml2nPDHnVSXIykJsbpoJIdxYvBmJiZFcxk3phAAj5zo90LExtI9Q7P9KvcLUNnsboRlRsG2qGgZQUxmr6ori4sPWtFaYWIiE2ISw/i/TDGmNFSXpJWH5WQQGfVUBflJur5gRTNcMAoGZ0IrlKS8PWt2YymVCWxYFdmmlxxmJYzOGZ4m0yce4AfVFFhewKZqduGGCspuuFOSAuyVwCs0ndQ4CiL9zDR0uWAGY2MfpcYqJauw5eS91majIBy5bJroJUUVIS9r41e6wdpRmcrEpCcVoxUuJSwvoz4+NFICACgOXLQ1oVHVHqhgFA9LGpOLhC0WU2AytXRuRHr1iwImzdwqRdZpMZq3JWReRn3367WpvLkBzJyWoHQ7XDQAQvAqQhS5ZELBQmWBNQkaXoIB5FTWlGadh7BabZ7cCXvhSRH00asmqV2kNGCpf2uZISICNDdhUki8UCrFgR0Y9Ynr0c1hhrRD+D1GUxW7AyJ7I3HcuWcS81I8vMVG+ToeupHwYAYPVq2RWQLLfeKgZeI8hmsWF59vKIfgapqyKrAvZYe0Q/w2oFbrstoh9BCtPCJUwbYSAvD8jJkV0FRVtcnAgDUbB03tKIXxBIPdYYa9SCYEUFF0gZUU6ONrbN0UYYAIC1a9UecKHwW7lS3FJFgcVswZqFa6LyWaSOlTkrYbNEp/8+JgZYwyZmKGYzsG6d7Cr8o52ra2amWJdBxpCTE/WNp27JuAX5KYouAqawy07Mjvrk0UWL1HtaHUXObbdpZ8qbdsIAINbopKfLroIiLTYWuPNOKR+9qWATJxMagMVswebCzSE9pjhYGzaIETDSt4wMbc0T0VYYMJuBzZs5XKB3a9YASUlSPtoea8f6vPVSPpuiZ1XOKiTb5OxhEh8PrGcT0zUtXqo0VOrnOFygbxKGB65XmlHK4QIdy07MxtJ5S6XWUFICFBZKLYEiSEvDA9O0FwYADhfolcThgettKtgEWwwXhuuNzOGB623cyOECPdLa8MA0bYYBsxn48pfFxYP0Y+NGacMD17PH2rGpYJPsMijM1uetlzY8cL34eNGVrEAuoTCJjRWXJi0ND0zTYMmfS08HKitlV0HhsmyZ6DtVSFFaEW5fcLvsMihMKrIqsCRTrc3h8/O547pemEwiCKSlya4kONoNA4AYdOORpH35+cpu0bUyZyUKUwtll0EhyknKwbo8NRd833ab+lvV0txWrgQKCmRXETxthwFAzB8oLpZdBQUrNVXEaYX7Sr9c9GWkx3OOilYl25JxV/FdMJvUPd3deaeYG03atGiRNucJXEvdoyMQmzdrb+omid0F77knarsMBstituCeRfcgzsLZXloTa47FPYvuidoug8GyWMShYOeO2JqTmanMvOeQ6CMMTB9JEX6gDYWR2QxUVQEpkXlsbLgl2ZJQVVyl9N0lzWSCCZVFlUiL18YgbkICcNddYtti0ga7XVx6LBbZlYROP2e2xETgvvu4VkcLpmfaaOHpHdfIScrBlqItDAQasalgk+bme8yfD9x9tzZnoxtNXJy45CQkyK4kPPTV5NLTgXvvVb7b2fDuvFOz8zyK0opQWVgJE9Sd40DAhvwNWJy5WHYZQcnLE51mDATqstmAbdu0u3JgNvprbpmZDASqMpmATZuA0lLZlYRkUfoisXENA4GS1uetR3mW3F0sQ1VYCGzZwkCgIptN9Ajobd87k8/n88kuIiIcDuAPfwDGx2VXQoAIAps3A7fcIruSsGnqb8KB5gPw+ryyS6HPbczfiLKsMtllhE1LC/Dee8DUlOxKCBBDA9u26S8IAHoOAwDQ3y8CgcsluxJjm94xUqNDAzfTPNiM9y6+x0AgmQkm3Fl4J0oztN3rNJv2dmDfPsDjkV2JsdntIgikpsquJDL0HQYAYHRUHEkOh+xKjCkuTsyIys6WXUnEdI92Y3/Tfox5xmSXYkjWGCuqiquQm6ytCamBcDjEaWx0VHYlxpSVJU5jepksOBv9hwFAROoPPgAuXpRdibFkZIh1N4mJsiuJuFH3KN5tfBd9Y32ySzGU1LhU3LPoHqTEaWOJaijGxoD9+4HubtmVGEtJiZjzrPcln8YIA9NOngSOH5ddhTEUF4s5AnpYgOsnj9eDD5o/wMUBhs5oyEvOw5biLbDGGGeysNcLfPQRUF8vuxL9M5mAVauA5ctlVxIdxgoDANDcDBw4AExOyq5Ev1asEC+DOtl1Esc7GToj6db5t2LNwjVKPIpYhjNngCNHAIOdvaPGahXTnPLzZVcSPcYLAwAwMADU1AB97NINq/h4sXRQy0/rCJOWwRZ82PIhxj1czRJO1hgrNuRvQEm6Wk+4lKGzU4x+ch5BeGVmiiCg14mCN2LMMACI/raTJ4FTp8R/U2gWLQLuuIM7QF5j3DOOg60HOWwQJnnJedhUsAkJVh3P4gqQ2w18/DFQVye7Eu0zm8Vz75YvN+b+DsYNA9P6+kS8Zi9BcOLjgQ0bgKIi2ZUo6+LARRxsPchegiBZY6xYl7tOszsKRkN7O1Bby16CYGVmiilOetw/wF8MAwB7CYLF3gC/sZcgOOwN8B97CQJn9N6AazEMXKuvTxxNHR2yK1FbaiqwerXYM5UCcmngEv7U8ScMTwzLLkVpCbEJWLVwlS43EYq0zk5xGuPWKjeXlwesWWPs3oBrMQzMpr0dOHqUR9P1EhLEKoHFi8W6GwqK1+dFnaMOJzpPcKOi69hibLhtwW2oyKpAjFnnC7sjrKkJOHYMGGbunGHePBECFiyQXYlaGAZu5uJFcTQNDcmuRC6bTfSjVVQYat+ASPN4PTjdcxqne07DPeWWXY5UFrMFX5r3JSzLXmaofQMizesVwwYnT3JXdnZo3hzDwFy8XrHDx6lTwMiI7Gqiy2oFystFEOBTICNm3DOOU92ncK73HDxeY21AH2OKweLMxbh9we2wx9pll6NbHo/Ym+Czz8ROhkaSkiJOYaWl7NC8GYYBf/l8QFsbcO6c+FPP/2yZmSIElJSwJyCK3FNuNPQ14FzvOQyOD8ouJ6KSbckozyrH4ozFsFlssssxDK8XuHQJOHtW39sam0xiu5PyciBXv4+sCCuGgWCMjIhQUF+vn0ckx8SILYQrKsSgGknVOdKJc73n0DzYrJsnIppgQn5KPsqzypGXkie7HMPr7xensQsX9LMha3w8UFYmXnp+qFAkMAyEYmpKxOxLl8SkQ60dUWazeJpgYaHoBeASQeW4Jl2od9SjebAZva5e2eUEJT0+HYWphViSuQSJVv0/tEprJifFZMPmZrGQampKdkWBsVrFyoCiInEqM/oSwWAxDITL1JRY09PSIl5Op+yKZjd95BQUiD9t7KLVCtekCy2DLWgZakHHcAemfGqetc0mM3KScpCfko/C1EIGAA3xeMR9TUsL0Nqq7vyCpCRxCisoEKsCGABCxzAQKQ6HmFvQ2yv+W9bWYDabmAOQlQUsXMgjRyc8Xg/ah9vRPtyOXmcv+sb6pA0nmE1mpMWlISshC7nJuchNzuWKAB3w+YDLl0U4cDjEqUzWioTkZHEamzdPzAHg3gDhxzAQLePj4miaDgf9/aL3IFx9ciaTGDBLSxMX/ukAkJQUnp9PSvP6vOgf64fD5UCvsxcOlwP9Y/1h7z2IMcUgLT4NmfZMZNozkWXPQnp8OvcEMAiX62owcDjEM99cLtGjEA6xsWKsPz396mksM5MdmNHAMCDbxIQ4mpxO8afLJfrmpqbE1F+fT7zM5quvuDjAbp/5io/nuhn6ggnPBFyTLjgnnXBNuq68xibH4PV5r7wAcYc//YqzxCHBmgB7rH3GK87CeSX0RW731dPX9KlsfFycwqZPY4A4fZlMYr5yfPzV01dCgviTi5fkYRggIiIyOA4eExERGRzDABERkcExDBARERkcwwAREZHBMQwQEREZHMMAERGRwTEMEBERGRzDgOL+/d//HSaTCWvWrJFdCunInj17YDKZZrzmzZuHyspK/PGPf5RdHulIU1MTdu3aheLiYsTFxSE5ORl33HEHfvazn2FM1YcfGBD3e1JcdXU1CgsLcfToUTQ2NqKkpER2SaQjP/zhD1FUVASfz4eenh7s2bMH9957L95++21s27ZNdnmkce+88w4efvhh2Gw2fP3rX8fSpUvhdrtx8OBBPPvsszh79ix+/vOfyy6TwDCgtEuXLuHw4cPYu3cvdu3aherqanz/+9+XXRbpyNatW7Fy5corf//GN76B+fPn47XXXmMYoJBcunQJO3bsQEFBAWpqarBgwYIr733rW99CY2Mj3nnnHYkV0rU4TKCw6upqpKWl4b777sNDDz2E6upq2SWRzqWmpiI+Ph4WbhJPIfrRj36E0dFR/PKXv5wRBKaVlJTgO9/5joTKaDYMAwqrrq7Ggw8+CKvVikceeQQXLlzAsWPHZJdFOjI0NASHw4He3l6cPXsWTzzxBEZHR/Hnf/7nsksjjXv77bdRXFyM9evXyy6F/MD4r6gTJ06grq4OL730EgBgw4YNyM3NRXV1NVatWiW5OtKLqqqqGX+32Wz4j//4D9x1112SKiI9GB4eRkdHB7761a/KLoX8xDCgqOrqasyfPx+VlZUAAJPJhO3bt+PVV1/FT37yE8TE8PnxFLrdu3ejtLQUANDT04NXX30V3/zmN5GUlIQHH3xQcnWkVcPDwwCApKQkyZWQvzhMoKCpqSm8/vrrqKysxKVLl9DY2IjGxkasWbMGPT09eP/992WXSDqxevVqVFVVoaqqCo8++ijeeecdlJeX48knn4Tb7ZZdHmlUcnIyAGBkZERyJeQvhgEF1dTUoKurC6+//jpuueWWK6+vfe1rAMCJhBQxZrMZlZWV6OrqwoULF2SXQxqVnJyMnJwcnDlzRnYp5CcOEyiouroa8+bNw+7du7/w3t69e/Hb3/4WL7/8MuLj4yVUR3rn8XgAAKOjo5IrIS3btm0bfv7zn+PIkSNYt26d7HJoDgwDihkbG8PevXvx8MMP46GHHvrC+zk5OXjttdfw1ltvYfv27RIqJD2bnJzEvn37YLVaUVZWJrsc0rDnnnsO1dXV+OY3v4mamhrMnz9/xvtNTU34/e9/z+WFimAYUMxbb72FkZERPPDAA7O+v3btWmRlZaG6upphgEL2xz/+EXV1dQCAy5cv49e//jUuXLiAv/mbv7ky7ksUjEWLFuHXv/41tm/fjrKyshk7EB4+fBhvvPEGHnvsMdll0udMPp/PJ7sIuuqBBx7A/v370dfXB7vdPuvX7Ny5E9XV1ejq6kJGRkaUKyQ92LNnD3bu3Dnjf4uLi8OSJUuwa9cu7Nq1CyaTSVJ1pCcXLlzAj3/8Y+zfvx+dnZ2w2Wy49dZbsWPHDjz++OOw2WyySyQwDBARERkeVxMQEREZHMMAERGRwTEMEBERGRzDABERkcExDBARERkcwwAREZHBMQwQEREZHMMAERGRwTEMEBERGRzDABERkcExDBARERkcwwAREZHBMQwQEREZ3P8HIuEs4hda77sAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "venn3([\n",
    "    set(part_first['smiles'].tolist()),\n",
    "    set(part_second['smiles'].tolist()),\n",
    "    set(part_third['smiles'].tolist()),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_1 = pd.concat([part_first, part_second])\n",
    "test_1 = part_third.copy()\n",
    "\n",
    "train_2 = pd.concat([part_first, part_third])\n",
    "test_2 = part_second.copy()\n",
    "\n",
    "train_3 = pd.concat([part_second, part_third])\n",
    "test_3 = part_first.copy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "min_vertex_k_cut.test_split(train_1['smiles'], test_1['smiles'], threshold=0.4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [],
   "source": [
    "min_vertex_k_cut.test_split(train_2['smiles'], test_2['smiles'], threshold=0.4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [],
   "source": [
    "min_vertex_k_cut.test_split(train_3['smiles'], test_3['smiles'], threshold=0.4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib_venn._common.VennDiagram at 0x7f65a3cc23b0>"
      ]
     },
     "execution_count": 27,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAgMAAADVCAYAAADKI/NMAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAApyUlEQVR4nO3de3Bc1Z0n8O9ttVpSq9V6W7Is62VjW7IA4beNY6zYQBwMmWIhNstMBlfCeqkwCVCBSXaozaOG1CSZJGQYT1GpZMZUUGAD62QhJMEEBfwMNja28UOyJEutp/W0Xt1St1rd+8dBsoUf3ZK6+5x77/dT1WXsbql/Eqfv/d5zzj1HCwaDQRAREZFpWWQXQERERHIxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMMAERGRyTEMEBERmRzDABERkclZZRdgWsPD4uHxXP0YGQHGx4FAAAgGxes1DbBYxCMxEbDbLz+Sky//d0qKeA2ZmmfMg0sjl+AZ88Az5oF7zD35354xD0b9owgEA5MPALBolslHkjUJ9nj7VY9kWzIykjKQaE2U/BOSbOPjwMCAOGS53VMPYW434PWK1wSDVx/G4uKApKRrH8KSkwGnU7yWYkcLBif+N1HUDAwAPT1Ad7f4s6cH8Pmi815WK5CRAWRnA1lZ4s+0NAYEAxsZG0G3pxs9nh50u7vR7emGZ8wT1fd02BzIsmch254t/kzOZkAwML8f6Ou7fAjr7gb6+8X1SjRYrUBm5uXDWFYWkJ7OgBBNDAPR0N8PuFxAS0t0T/zhmggI+flAYaH4hJFu+QN+tA62wtXvQutgK9xjbtklARABId+Zj8LUQsxzzoPVwo5HvQoGgY4OcRhra4vuiT9cVqsIBfn5QFGROKRR5DAMREIwCFy8KD45LpfoCVCZ3S5CQWEhMG+e6LMjpXnGPHD1u+AacKFtsA3jwXHZJd2Q1WLFvJR5KEwrRGFqIZLik2SXRCH4fEBrK9DUJK5jvF7ZFd1YSsrlw9jcuez8nC2Ggdno6gLOnRMBYHRUdjUzY7UC8+cDS5aIP0kZ/oAf9X31qOmpQZe7S3Y5M6ZBQ44jB0uylmBB+gLEWRg+VREIiJN/TQ3Q3i7/6n+mbDYRCkpLgdxc2dXoE8PAdPn9QH09cPasGAIwEqdTfJoWLxaTFEmK/tF+nO0+i/O95+EblzzEFGGJ1kQsylyEsuwyOBOcsssxLbdbXMfU1IgJf0aSkQGUlQE33QTEx8uuRj8YBsI1MCACQG2t/DkA0RYXByxYID5Rc+bIrsYUgsEgmvqbcKb7DNqH2mWXExPznfNRll2GgtQCaJwZFhNtbeIw5nLptxcgXDabCARlZWLyId0Yw0Ao/f3A0aNAY6PsSuTIzQVWrwZycmRXYlgXLl3A0bajGPAqPtckStIT07Fq3ioUphXKLsWwWlrEYcxonZnhKioCVq5kKLgRhoHrcbuBY8dETwB/RWJAbtUqfpoiqG2wDR+0fYAej0mP0J+Sk5yD1fmrkevgoG+kdHUBR46I+QBmp2mip2DFCsDhkF2NehgGPs3rBU6cAM6cEfMD6DJ+miKi292NI21H0DbUJrsUJRWkFmDVvFXISOK9YzPV3y9CQFOT7ErUExcHLF0KVFRwatSVGAYmBIMiAHz4ofHnBMxWXBxQXg4sXy7uRqCwjPpHcajlEOr76mWXojwNGhZlLsLa+Wthi7PJLkc3fD4RAs6dY4dmKDYbsGwZcPPNXMwIYBgQBgeB994TawVQ+FJTgY0bOZ8gDI2XGnGg+QBG/COyS9GV5PhkfKbwMyhILZBdivJaW4F9+8Qq5xS+nBzgjjvEQq1mZu4wEAwCp0+LmTUcEpgZTRPResUK9hJcw6h/FAeaD+DCpQuyS9G1RZmLsG7+OvYSXIPPB/z1r+I2QZqZuDgxwdDMvQTmDQPsDYgs9hJchb0BkcVegquxNyCyzNxLYM4wUFMDHDrE3oBI0zQxK2fFCvPGawDjgXHsb96P873nZZdiSGXZZVg3fx0smnnXnw0ExCHs7FnZlRhPXBywbp1Yf81MzBUGAgHg8GExUZCip6AA+OxnxQwdk/GMefB2/dvo9nTLLsXQch25uGvBXabcKXF0FNi7l52a0VZWJkKBWfY8ME8Y8HqBd97hDbexkpYGfO5zYoljk+hyd2Fvw96obx9MgsPmwN0L7kamPVN2KTHT2wu8/TaHBWIlLw/YvNkctyCaIwxcuiQ+QYODsisxl4QE8UmaN092JVFX11uHfa59yu8maDRWixWVRZUoTi+WXUrUNTYCf/kLRzdjLSUFuPtu42+ZbPww4HIB1dXA2JjsSsxJ04C1a8W6BAYUDAZxpO0ITnaelF2KqS2fuxzL85bLLiNqjh0TD5IjPh6orBTLGhuVscPA+fPA++9z9Q0VVFSI5YwNJBgM4r2m91DXVye7FIKYWLi+YL3sMiJu/36xiBDJpWnAhg1iU1cjMm4YOHdOfIpIHTffLHoJDCAQDKC6sZrrByhmceZibCjcYIhdEINBcS1znjelKGX9ejG50GiMGQbOnAEOHpRdBV1LWZn4NOlYIBjAny/8GU39TbJLoWu4KeMmbCzaqOtAEAyK+QH1XLlaSevWGW/k03g3TdTUMAio7OxZcXunTgWDQVQ3VjMIKKyurw77m/XdK/j++wwCKjt0yHhDN8YKA+fPc2hADz7+WOymokPvu97n0IAO1PTU4EDzAdllzMj+/Rwa0AOj/X8yThhobeVkQT2Z2CZaR460HeGqgjpytvssTlw8IbuMaTl2zHhXnEb2/vvi1GMExggDg4PAu+8yCOjN4cO6WQSqoa9BdycWAo62HUXzQLPsMsLS2MjbB/UmGBSnnoEB2ZXMnv7DgM8H/OlPYoVB0pdAQKwKqfhiUD2eHrzvel92GTQDQYg5Hv2j/bJLuaG+PjFhkPTH6xVr2vl8siuZHX2HgWBQLCjU3y+7EpqpiU+SootCjYyN4O36t+EPcNk3vfKN+/Cn+j/B61fzgmF0VHwEuLKgfvX3i1ORnjun9R0GjhwBmvXRBUg3cOmSkp+kQDCAvQ174R5zyy6FZmnQO4g/X/gzVLuTeqJzbGhIdiU0W83Nup0XDUDPYaChATjJJWANw+VSbsD0YPNBdLo7ZZdBEdI21IYP2j6QXcYUhw8DHR2yq6BIOXlSnJr0SJ9hwOMBDujztiG6gY8+Arq6ZFcBAGgZaMG5Hk7rNppTnadwcViNvX9bW3V3Qw2F4cABcYrSG32Ggf37OWHQiIJB4L33gHG5O//5xn3Y59ontQaKnvea3pM+B8TnA/axiRmS16vP5W70Fwbq6kSXMhlTf7/04YLDLYc5T8DABr2DONImd3D3r38FhoellkBR5HKJU5We6CsMeDxiHUgytpMnpQ0XNA80o7a3Vsp7U+yc7jotbbigtVWsmk7GduiQvoYL9BUGODxgDhPbtcV4uMA37sN+lw7792hGZAwXcHjAPPQ2XKCfMNDQwOEBM7l0SUwojKEPWj/g8ICJDHoHcaw9tkNSR45weMBMXC793F2gjzAQCOj7Bk6amVOnYtbP1j/aj5oe9t2azemu0xj2xebsPDDA4QEzOnJEnMJUp48wcPYsV+UwI78/ZpMJj7QdQRBqLUhD0TceHMeH7R/G5L2OHtXHSYEia2hInMJUp34YGBuLeXcxKaS2Nuq7gHS5u9DU3xTV9yB11fXW4dLIpai+R3c3cIE7X5vWRx8pu+L6JPXDwKlTwMiI7CpIlkBAXFJFkezbzEiuIII42h7lNsYmZmojI+JUpjK1w8DoqPq/QYq+CxfEpVUUtA62on1IH9soU/Q09Tehczg6S0+3tgJtbVH51qQjp06JU5qq1A4DeuhbodiI0qUVewVoQrTaQpQ7tkgnVB/xVjcM+HycekuXtbWJTd8jqH2oHT2enoh+T9KvjuGOiLeH9vaodWqRDp07J05tKlI3DNTVsVeAporwri5nu3UwxZdi6kxXhNsYmxhdwe8Hzp+XXcW1qRsGuJ0XfVp9fcRitWfMwzsI6CoNlxrgG49QG/MATU0R+VZkIOcU3QxVzTDQ3i42rCG60thYxHb/ONd9DoEgb/qmqfwBP2p7IrM3RU0N1xWgq126JE5xqlEzDLBvja4nAm0jEAxwtUG6rkgMHwWD6l4BknwqnuLUCwPsW6MbiUCsdvW7uAcBXdeAdwCtg62z+h4uF+BmE6PraGpSb0dD9cLA+fPsW6Mbq51dNy57BSiU2Q4V8EYoupFAQL2JhOqFAfYKUCjNzTMOjGPjY1xkiEJqGWyZ8ZwSv5+LDFFoqp3q1AoDIyNAV5fsKkh1Xi9w8eKMvrR1sBXjwfEIF0RG4xv3zTg0trQA42xiFEJ3t1or7asVBlwu2RWQXsywrbgG2MYoPK7+GbYxNjEKQzCoVlthGCB9mkFbCQaDaB5ojkIxZEQzCY7BoBjFIgqHSqc8dcIAB9poOgYHxZ0F09Dp7sSoX+GdQkgpw75h9Hp6p/U1nZ1qb0ZDamlrE6c+FagTBlT6rZA+TDNWc8VBmq7p9g6odKVH6lPpGlitMEA0HdNsM7yLgKZrum1GxZXlSG2qnPrUCQM93D2OpmkabSYQDKBvJLK7HpLxTWcXw0AA6J3eqAKRMqc+NcJAMKjOb4T0w+sVcwfC0DfSx70IaNp84z4MjA6E9dq+Pq6XRtPX0yNOgbKpEQb6+zlfgGYmzBDZ7eam8jQz4fYO8HqGZsLvBwbCy5tRpUYY4KeIZirMtjOd7l6iK3V7wguS3cybNEMqtB01woAKvwnSpzDbTrgHdKJPCzdI8jBGM6XC9bAaYUCF3wTpUxhth5MHaTbCCQOBgJgzQDQTKgRJNcJAf7/sCkivvN6Qe4EOegc5eZBmzDfug9t34/2IBwc5eZBmToVToPwwMD7OJbtodkKEAc+YYhuHk+6EakOq7U1P+jI6Kj9Myg8D/BTRbDEMUJQxDFC0yW5DDAOkfyHaUKguXqJQQoUBN5sYzZLsUyHDAOkfewYoytgzQNEmuw1Z5b495P8GYmDf+fP40d69ONbcjI6BAfz2scfwNxUVk8/vOX4cL+7bh2PNzehzu/HRs8+iYv78Kd+jobsb33j9dRyor4fX78fnli7FC9u3I8fpnHxNn9uNf3j1Vbx56hQsmob/tmwZfvbFL8KRmBirH1UOhgGcP34ee3+1F83nmjHQM4DH/vUxVGysmHz+ePVx7Pu/+9Bc0wz3gBvPVj2L+YuntrHu1m68/vzrqD9RD/+YH0vXLsX2p7fDmenEp435xvAvj/wLWs+3XvN7GY177MaX/iY4jOH8+X3Yu/dHaG4+hoGBDjz22G9RUfE3k88fP74H+/a9iObmY3C7+/Dssx9h/vyKKd+ju7sBr7/+DdTXH4Df78XSpZ/D9u0vwOnMmXzNH/7wHD7++C20tJyA1WrD88/3x+YHlEx27xJ7BmLA7fPh1vx87Hrooes+v37hQvzg/vuv/bzXi7uefx4agOqnnsLBZ56Bz+/Hvbt2IXDFrJOHf/lLnGlvxztPPIHfP/449tXV4X+8/HI0fiS1MAzAN+JD/k35eOgfr93GfCM+LKxYiPv/4dptzDvixfNffR7QgKdefArP/PIZ+Mf82PXk1DY2Yc+/7UFaVloEfwK1sWcA8PncyM+/FQ89tOu6zy9cuB733/+Daz7v9brx/PN3AdDw1FPVeOaZg/D7fdi1694pbczv92H58gdxxx2PRePHUJbsNiS/Z8AEdxJsKS/HlvLy6z7/d2vWAACarnPP/MGGBjT19uKjZ5+FMykJAPDSjh1If/JJVNfWYnNpKc51dOBPZ87g6Le+hRVFRQCAF7Ztw+f//d/xrw88gLy0tIj+TEoJ0YZG/cZvY+W3l6P89uu3sTX3iDbW037tNtZwsgG9Hb14tupZJDlEG9vx3R14svJJ1B6tRenq0snXnj54Gmf/ehY7f7gTpw+djuBPoa5QbcgEhzGUl29BefmW6z6/Zs3fAQB6epqu+XxDw0H09jbh2Wc/QlKS6G3aseMlPPlkOmprq1FauhkAcN993wUAHDq0O3LF64DsNiS/Z0D2/RQ64B0bg6ZpSLBezm6JVissmoYD9fUAgMMXLiDNbp8MAgCwubQUFk3DB42NsS45tkK0Ia4xENqYT7Qxq+1yG7ParNAsGupP1E/+22DvIH713K+w43s7YEu0yShVilBtiIex0MbGvKKNWRMm/81qTYSmWVBff0BiZWqQ3YYYBnRgTUkJkm02/OOePfD4fHB7vfjG669jPBBAxyc7XFwcGMCclJQpX2eNi0NGcjIuhrmzn24xDMxayc0lsCXasOeFPfCN+uAd8eL1519HYDyAgR7RxoLBIHZ/dzc23L8BRWVFcguOsWCIbeV4GAutpGQNbLZk7Nnzj/D5PPB63Xj99W8gEBjHwECH7PKkk71zofwwIPs3oAPZKSl4bedOvHnqFBxf+xpSn3gC/SMjWFZQAIumyS5PvhBH4iDYxkJJSU/Bzh/sxKl9p/C1z3wNT2x8AiNDIyhYUgDNItrYX/7PXzDqHsWWHdfvKjaqUIGSh7HQUlKysXPnazh16k187WsOPPFEKkZG+lFQsAyaJv9UJJvsQCl/zgCF5a6yMjQ89xx6hodhtViQZrcj9+mnUZKVBQDITU1F19DQlK/xj4+jz+1GrvPq2eCGwkAUEWVryvDc/3sOw/3DsMRZYE+x4+m7n0bWPNHGao7W4MLHF/DVdV+d8nXf/9L3sepzq7DjuztklB0TGttYRJSV3YXnnmvA8HAPLBYr7PY0PP10LrKySmSXZnryw4CFiXA6shwOAEB1TQ26hoZw3623AgDWlpSg3+PBMZcLywsLxWtqaxEIBrG6uFhavTER4kBt4VXHtDjSRBurOVqDob4h3LpBtLHtT2/HFx77wuTrBnoG8LPHf4ZHv/8oisuN3cY0hGhjbGLT4nB8EjBrqjE01IVbb71PckXyyW5DDAMxMDw6ivortqVq7OnBiZYWZCQnoyAjA31uN5r7+tD+yW4VtRcvAgBynU7kpqYCAP7r4EGUzp2L7JQUHG5owNd/8xs8uWkTFufmAgBK587F55YuxaO/+hVefPhhjI2P4/FXXsH2FSuMfScBELINmSEMjHpG0d1yuY31tPWgpbYFyanJyMjNgHvAjb6Lfejv7gcAXHSJNubMdCI1S7Sxg28cxNziuUhJT0HDqQb85se/wab/vgm5RaKNZeRmTHnPBLuYCJadn430nPRo/4hShWpDJjiMYXR0GN3dlyeT9vQ0oqXlBJKTM5CRUQC3uw99fc3o728HAFy8WAsAcDpzkZoq2tDBg/+FuXNLkZKSjYaGw/jNb76OTZueRG7u4snv29fXPPm9AoFxtLScAABkZy9EYqIjRj9t7MluQwwDMfChy4XKn/xk8u9PvfYaAODv167F7kcewRsnT2LHSy9NPr/9F78AAHx761Z85957AQC1nZ341u9+hz63G0WZmfinLVvw5ObNU96n6stfxuOvvIJNP/3p5KJD/7ZtW7R/PPni4m74tBnCgOusCz/5n5fb2Gs/FW1s7da1eOQ7j+DkvpN46buX29gv/pdoY1sf3Yp7d4o21unqxO92/Q7uATcy8zKxZccWbH54ahszqzhLiDZm/CYGl+tD/OQnlZN/f+21pwAAa9f+PR55ZDdOnnwDL710eajoF7/YDgDYuvXbuPfe7wAAOjtr8bvffQtudx8yM4uwZcs/YfPmJ6e8zxtv/G8cPny5rf7zP98GAHjqqb9g8eKN0fjRlBDiMBZ1WjDUNNloO34c+PBDqSWQzpWUAJuvf9L6Q90f0DrYGsOCyGiK04px54I7r/v8H/4AtLKJ0SysWAEsWybv/eXnWbtddgWkdyHakD2ebYxmJ1Qb4mGMZkt2G2IYIP1LTr7h0wwDNFvJthBtjE2MZkl2G2IYIP1jzwBFGXsGKNpktyGGAdI/hgGKMoYBirYQHZxRJz8MJCVx0RiaHYYBijKGAYomiwWQvdO8/DCgafwk0eyEiNQOm3HvTabYSI4P0cbYxGgW7Hb518TywwAAZGbKroD0yuEAbDfePc9hc8AWZ54d9iiykuOTkXDFTnvXEkYzJLqujIzQr4k2NcLAJ+vrE01bdnZYL8uys43RzGQnh9nG2MRohlRoOwwDpG9hth2GAZqpcNtOmLmU6CoqtB01woAKvwnSpzDbTradbYxmJtwwwGsamikVToFqhIHkZHFXAdF0sWeAoizcIKnCAZ30x25XYw69GmEA4CeJps/hCPt+nNTEVE4ipGlLjk9GUnx4FypOJycR0vSp0qPEMED6NWfOtF7O3gGarnAnD06+nocxmiZV2ow6YWD+fNkVkN5Ms83Md7KN0fRMt83wMEbTpUqbUScMzJmjxsAJ6YOmAQUF0/qSwrTCKBVDRjXdNlNUFJ06yJjs9ml3cEaNOmEAmPbBnUwsO3vak07TEtOQmpAapYLIaLLt2dNeytrpBNLSolMPGY9Kpzy1wkAhr9woTDO8BGPvAIVrpm2FhzEKl0ptRa0wMG8eYLXKroL0YIafoqK0osjWQYZVmMowQNFjtYpTnirUCgOq/XZITU4nkJ4+oy/NSc5BolXy9mCkPIfNgUz7zPZMycmRvwMdqU+1a1+1wgAAFBfLroBUN4s2omnajK/4yDyK02bTxjiRkEJT7VSnXhgoKQESbrxDGJlcaensvjx7dl9PxjfbNlJWFqFCyJASEsSpTiXqhQGrFVi8WHYVpKr8fDFMMAtzkudwrwK6rryUPKQlps3qe2RlqbOYDKln8WK1hggAFcMAwFhN17d0aUS+TVk22xhd29LsyLSxCDVVMiAVT3FqhgGnU1wBEl3J4YjYjbkLMhYgIY7DUTRVcnxyxG4/XbCAI550tQh0bkaFmmEAUDM6kVylpWJ2VgRYLVYszuJwFE21JGsJLFpkDotxcRzxpKupempTNwwUFoorQSIAsFiAJUsi+i05VEBXsmiWiE8uVfXAT3I4HOquQ6FuGNA0oKJCdhWkiiVLpr38cCjOBCdK0hWb0kvSLMpcNO3lh0NxOsVwAREgTmkR6tyMOHXDACBOACoOrlBsWa3AsmVR+dYr81ZGrFuY9CtOi8Pyucuj8r1XrhQdW2RuTmfEOzcjSu0marGITxKZ2803R21Hy9TEVCzO5MCu2ZXPKUeyLTkq31v1kwDFxooVaodChUv7xIIF4qZdMqfERODWW6P6FsvzlsNqUeymX4oZW5wNFbkVUX2PZcvUu6+cYicrC1i4UHYVN6Z+GACAVatkV0CyVFQANltU38Ieb0f5nPKovgepqyK3AgnW6N4DaLeLDi4yJz2cwvQRBvLzgbw82VVQrDkcMVu5pSK3gusOmFAsg+Ctt3IDIzPKy9PHsjn6CAMAsHat2gMuFHlr1oibtWPAFmfD8rzoTCAjda2atypmQ0Q2mxg3JvOwWMRhTA/0c3bNzOSthmZSXBzznTzK55Qj15Eb0/ckeQpSC7Aoc1FM37OsjJ2cZlJRoZ8pb/oJA4CYhZORIbsKirbERGD9eilvvbFoIycTmoAtzobPFHxGynvfcQcQHy/lrSmGMjKidkd0VOgrDFgswMaNHC4wuttvj/gCQ+FyJjixap4OZvvQrKybvy5qtxKGkpICrF4t5a0pRvR4qtJRqZ/IyuJwgZEVF0tfsq18TjnmOuZKrYGiR8bwwKdxuMDY9DQ8MEF/YQDgcIFRSRwe+LQ7iu7gcIEByRwe+DQOFxiT3oYHJugzDFgswKZN/CQZiaaJfjVJwwOf5kxw4vb5t8sugyJsQ+EGacMDn5aSokz2pQiJjwc++1l9DQ9M0GHJn0hPByorZVdBkbJyJVBQILuKKRZnLeZiRAZyW+5tym1MddNNwC23yK6CIqWyUr+d1voNAwBQVMQbd41g4UJl54GszV+LeSnzZJdBs1SUVoSV89Tc52T1amD+fNlV0GytWCFOSXql7zAAiMGZGN+PThGUnQ1s2CC7iuvSNA2bSzbDmcDdM/UqIykDlUXq9iJqmhj1TEuTXQnNVEmJPucJXEn/YQAQY816m7pJYsH2u+5SfgeXBGsC7l5wN+ItnKOiN4nWRNy14C7Ex6n9/85mA+6+O+rbcFAUZGWJU5DeGSMMWK3ipBKlbW4pCib+nyWrMZkrlPSkdHy2+LPQoMkuhcJk0Sy66tVJTQU2b9bn5DOz0sn1TFiM0+wcDuCee7gTiB7ExYlP0Jw5siuZlsK0QtxRdIfsMigMGjRsKt6EvBR93cyfny8moWnMnMpLTBSnHIdDdiWRYZwwAIg7DO65B0jg7nPKsljE5Y8etvG6hkWZi5S5T52uTYOGyuJKFKcXyy5lRhYsEGsQkLpsNuDznxenHKMwVhgAxIZGDARqmlgforBQdiWzUppdyjUIFKVBwx1Fd2BhxkLZpczKokViXi17CNQzEQSMNk1NCwaDQdlFREVvL/DWW8DoqOxKCBBDA3feqdxaArNR01OD/a79CMKYHyG9sWgWbCzaqPsgcKW6OuC99wCDHqV1JzHRmEEAMHIYAIBLl0Qg8HhkV2JuE5MFdTo0cCN1vXV4r+k9BgLJLJoFm4o36XZo4EYuXACqq4FAQHYl5ma3iyCg10WFQjF2GAAAtxvYuxfo7pZdiTk5HCIIGDFKf6J1sBXvXngX3nGv7FJMaeL2wVxHruxSoubiRXEYY0enHFlZ4jBmlMmC12L8MAAAfj+wbx9QXy+7EnPJzRVDA4rsNxBNA6MDeLvhbfSP9ssuxVQykzJx98K74bAZ+Cj9ieFh4O23xQgoxc7EhE4j3D54I+YIAxNOnACOHuUAXCwsWSJ2YTHRTdO+cR+qG6vRPNAsuxRTKEkvwcaijabaXdLvF3MILlyQXYk5rFwJ3Hab7Cpiw1xhAACam4F33wXGxmRXYkwWC7BmDVBuzg1+gsEgjrQdwcnOk7JLMbTlc5djed5y2WVIc+yYeFB0TOw+qPMbn6bFfGEAAPr7xYycnh7ZlRiLwyHW5czT10Iv0VDfV48DzQfgG/fJLsVQEq2J2FC4AUVpRbJLkc7lEqOfIyOyKzGWzEwRBIy0hkA4zBkGADE198QJ4PhxTtONhNJS0SMQr/Ya8LHk9rmxv3k/hw0ipDitGOsL1iMp3vhzUMI1OgocOMBhg0iwWMSQwG23mWp0c5J5w8CEvj4xCMdegplxOMTqKAa8bTBSzveex6GWQ+wlmKFEayJun387FmQskF2KshobRShgL8HMZGaKTs3MTNmVyMMwALCXYKbYGxA29hLMDHsDwsdegukze2/AlRgGrtTXB3zwAdDSIrsStWVliRDAuQHTVtdbh6PtRzHsG5ZditKcCU6smrcKJeklskvRnaYm4MgRMTWKrm/ePHEYM3NvwJUYBq6lvV18mrq6ZFeiltRUYMUKceMtzdh4YBxnus/go46PuFDRpyRZk7Bs7jKUZpfCopn8Um0WgkGgtlbcceB2y65GLVlZwOrVIgzQZQwDN8KILdjtwLJlYu0As/elRZBv3IeTF0/i466P4Q/4ZZcjlS3OhltybsEtObeYat2AaPP7gTNnxCio1+S5MzVVrBtQws6ma2IYCCUYBM6fF5+mgQHZ1cSW3S7WCygvN/7yWxJ5xjw43nEctT21GA+Oyy4npqwWK0qzSnHb3NuQaE2UXY5h+XziEHb2rPhvM0lJASoqgMWLeS1zIwwD09HaKj5NLpexVzHMzQWWLgWKi/npiSGv34va3lqc7T6LQe+g7HKiKi0xDWXZZViUuQi2OJvsckzD7xersp89a+wbqDQNmD8fKCsTf3Ir6NAYBmZieBg4dw6oqTHOvTzx8cBNN4lPj1G35dKRloEWnO0+i+aBZsPsiGjRLChMLcTSOUuRl8LJp7J1dYkhhAsXgHGDdEglJooegLIy0SNA4WMYmI1AQMwraGwUdyDorf8tLk7MoikqEpMCeYugcoZ9w6jtqUVTfxN6R/S5Q02WPQvFacVYnLUY9ni77HLoU0ZHRW9BU5PYHVFvd1fHx4tlToqLxSMuTnZF+sQwECmBANDRIYYQXC5gaEh2RdeWlAQUFIhFt/PzORdAR4Z9w3D1u+AacKF9qB2BoJpH7TgtDnkpeShMK0RhaiGSbcmyS6Iweb3iusblUvv6JjlZHMIKC8UdzgwAs8cwEC19feLT1N0tBucGJY0B2+1Adra4nyY/H5gzhwNoBuAb96F1sBWtg63o8fSgb6RPWjiwaBZkJGUg256N+anzke/M5x0BBjBxfdPWdvkwJuuOBIdDHMKys8UcgKwsOXUYGcNArHi94tPU0yM+WX194gbgSO2eaLWKE396+uVPTVaW+DcyvPHAOPpG+tDt6UaPpwc9nh5cGrkU8bsT4rQ4ZCRlIMuehezkbGTZs5CRlME1AUxiaOhyMOjuBi5dEtOmInUWiYsTV/0ZGZcPY9nZYi4ARRfDgGx+P+DxiGDg8YjHyIiY0RMMXh7A0zQxs99iEZ+M5GRxop942Dgjm6426h+FZ8xz1WNkbASBYGDyAYgr/IlHUnwS7PH2yUdyfDLs8XYkWBMk/0SkmmBQHLImDl8Tj9FRcfiaeGja5cNYXJwYsZw4fE0czhLYvKRhGCAiIjI59u0RERGZHMMAERGRyTEMEBERmRzDABERkckxDBAREZkcwwAREZHJMQwQERGZHMOA4v7jP/4DmqZh9erVskshA9m9ezc0TZvymDNnDiorK/HHP/5RdnlkIA0NDdi5cydKSkqQmJgIp9OJ22+/HT/72c8wYpRdXw2AC4grrqqqCkVFRThy5Ajq6+uxcOFC2SWRgXzve99DcXExgsEgOjs7sXv3bnz+85/Hm2++ia1bt8ouj3TurbfewoMPPoiEhAR86UtfQnl5OXw+Hw4cOICnn34aZ86cwc9//nPZZRIYBpTW2NiIQ4cOYc+ePdi5cyeqqqrw7W9/W3ZZZCBbtmzBihUrJv/+5S9/GTk5OXjllVcYBmhWGhsbsX37dhQWFqK6uhpz586dfO6rX/0q6uvr8dZbb0mskK7EYQKFVVVVIT09Hffccw8eeOABVFVVyS6JDC4tLQ1JSUmwcmtrmqUf/vCHGB4exi9/+cspQWDCwoUL8fWvf11CZXQtDAMKq6qqwv333w+bzYaHHnoIdXV1OHr0qOyyyEAGBgbQ09OD7u5unDlzBo899hiGh4fxt3/7t7JLI5178803UVJSgnXr1skuhcLA+K+oY8eOoaamBi+88AIAYP369cjPz0dVVRVWrlwpuToyis2bN0/5e0JCAv7zP/8Td955p6SKyAgGBwfR1taGL3zhC7JLoTAxDCiqqqoKOTk5qKysBABomoZt27bh5Zdfxo9//GPExcVJrpCMYNeuXVi0aBEAoLOzEy+//DK+8pWvICUlBffff7/k6kivBgcHAQApKSmSK6FwcZhAQePj43j11VdRWVmJxsZG1NfXo76+HqtXr0ZnZyfeffdd2SWSQaxatQqbN2/G5s2b8fDDD+Ott95CWVkZHn/8cfh8PtnlkU45nU4AwNDQkORKKFwMAwqqrq5GR0cHXn31Vdx0002Tjy9+8YsAwImEFDUWiwWVlZXo6OhAXV2d7HJIp5xOJ/Ly8nD69GnZpVCYOEygoKqqKsyZMwe7du266rk9e/bgt7/9LV588UUkJSVJqI6Mzu/3AwCGh4clV0J6tnXrVvz85z/H4cOHsXbtWtnlUAgMA4oZGRnBnj178OCDD+KBBx646vm8vDy88soreOONN7Bt2zYJFZKRjY2NYe/evbDZbCgtLZVdDunYM888g6qqKnzlK19BdXU1cnJypjzf0NCA3//+97y9UBEMA4p54403MDQ0hPvuu++az69ZswbZ2dmoqqpiGKBZ++Mf/4iamhoAQFdXF37961+jrq4O3/zmNyfHfYlmYsGCBfj1r3+Nbdu2obS0dMoKhIcOHcJrr72GRx55RHaZ9AktGAwGZRdBl913331455130NvbC7vdfs3X7NixA1VVVejo6EBmZmaMKyQj2L17N3bs2DHl3xITE7FkyRLs3LkTO3fuhKZpkqojI6mrq8OPfvQjvPPOO2hvb0dCQgJuueUWbN++HY8++igSEhJkl0hgGCAiIjI93k1ARERkcgwDREREJscwQEREZHIMA0RERCbHMEBERGRyDANEREQmxzBARERkcgwDREREJscwQEREZHIMA0RERCbHMEBERGRyDANEREQmxzBARERkcv8feGAi3q9Qs/8AAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "venn3([\n",
    "    set(test_1['smiles'].tolist()),\n",
    "    set(test_2['smiles'].tolist()),\n",
    "    set(test_3['smiles'].tolist()),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib_venn._common.VennDiagram at 0x7f65a40c5cc0>"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZIAAAGJCAYAAACgk7WiAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAABHRUlEQVR4nO3deZSddZkv+u877nmo2jWnKkOlMlRmyEBIQgAJIKMeHMCDtLLURXv6tLY2euyly1b7aHsvF9qh6Ub7XBe9NNgHufS9tDQzKEgiBAICgZB5rHnY897vfP94yVypVNUefu/wfNaqFaiq7P2k6t37+/5mzrIsC4QQQsgM8awLIIQQ4m4UJIQQQipCQUIIIaQiFCSEEEIqQkFCCCGkIhQkhBBCKkJBQgghpCIUJIQQQipCQUIIIaQiFCSEEEIqQkFCCCGkIhQkhBBCKkJBQgghpCIUJIQQQipCQUIIIaQiFCSEEEIqQkFCCCGkIhQkhBBCKkJBQgghpCIUJIQQQipCQUIIIaQiFCSEEEIqQkFSQ//0T/8EjuNwySWXsC6FEN948MEHwXHcGR8tLS248sor8cQTT7Auz5NE1gV42datWzF37ly8+uqr2LdvH3p6eliXRIhvfO9738O8efNgWRYGBwfx4IMP4vrrr8d//Md/4MYbb2RdnqdQi6RGDh48iG3btuG+++5Dc3Mztm7dyrokQnzluuuuw6c//WnccccduPvuu/HSSy9BkiT8+te/Zl2a51CQ1MjWrVvR0NCAG264AR//+McpSAhhLJlMIhQKQRSpI6baKEhqZOvWrbjlllsgyzI+9alPYe/evdixYwfrsgjxjUwmg5GREQwPD2PXrl344he/iHw+j09/+tOsS/MciuYaeP3117F792789Kc/BQBs2rQJnZ2d2Lp1K9auXcu4OkL8YcuWLWf8fyAQwC9+8QtcffXVjCryLgqSGti6dStaW1tx5ZVXAgA4jsOtt96KX/3qV7j33nshCALjCgnxvvvvvx8LFy4EAAwODuJXv/oVPv/5zyMWi+GWW25hXJ23cJZlWayL8BLDMNDV1YXLL78cf/d3f3fy82+88QY++clP4qmnnsI111zDsEJCvO3BBx/EnXfeiR07dmDNmjUnP2+aJi666CIMDw/j0KFDkGWZYZXeQmMkVfb888+jv78f//Zv/4YFCxac/PjkJz8JADToTggjPM/jyiuvRH9/P/bu3cu6HE+hrq0q27p1K1paWnD//fef87VHH30U//7v/44HHngAoVCIQXWE+Juu6wCAfD7PuBJvoSCpolKphEcffRSf+MQn8PGPf/ycr3d0dODXv/41HnvsMdx6660MKiTEvzRNw9NPPw1ZltHb28u6HE+hIKmixx57DLlcDjfffPOEX1+/fv3JxYmeDhJdP/ND0wDLAiTJ/pBl+0+OY12pZ+mmDs3QYFgGBE6AyIsQeRGcj37mTzzxBHbv3g0AGBoawkMPPYS9e/fiG9/4BuLxOOPqvIWCpIq2bt2KYDB43umFPM/jhhtuwNatWzE6OopUKlXnCmfINIFczv7IZk/9mc/bIXEiLHQdMIypP64ongqX00MmHAYSCfsjHrc/fLyIzLRMZJXsGR9lvQzN0KCZ2oR/Wph4Do3ACZAE6WSwiLwIibf/PygGEQvEEA/EEZPtPyNypM7/2ur59re/ffK/g8EgFi9ejH/+53/GXXfdxbAqb6JZW+SUYhEYHATGx08FRi4HFAp2i4KlSORUsJwImUQCSCY90bKxLAsZJYNMOYOMkjkZGJlyBnk1f95gqDWBE84Jl3ggjqZwk6tDhlQXBYlfWRYwOmoHx4mPXI51VdMny0Bb26mPlhaAd/5kRN3UMVQYwkB+AAP5AQzmB6GZGuuypiUqR9EaaUVrtBVt0TakQilfdZ2RUyhI/EJRzgyNoSG7K8prBAFobgba2+1gaW21w4axsl4+GRoD+QGMFEdgWibrsqpK5EW0RFrQFm07GTCywP5nT2qPgsTL0mng0CHg8GE7OPz4q+Y4IJUCOjuB7m6gqakuT2tZFvpyfTiYPoi+XB/S5XRdntdpUqEU5iTnYG5yLprC9fnZk/qjIPGaoSHg4EE7PNJp1tU4TyJhB0p3tx0wVWRZFvrz/dg/th+H0odQ0ktVfXy3i8pRzEnMwbyGeWiPtlM3mIdQkHjB6Ciwfz9w4IA9SE6mJpk8FSqNjTN6iBPhcWD8AA6OH6TwmKKQGEJ3QzfmN85HW7SNdTmkQhQkbqUowO7dwPvvU8ujGhoa7EDp6bFbLRfQn+vH/vH9FB5VEJWjmN8wH73NvYgHaH2HG1GQuM3YGPDOO8C+fd4cLHeCzk5g2TKgq+uMqcWaoWHP6B7sGt7l2zGPWuLAYXZiNpa1LMOs+CzW5ZBpoCBxA8uyxzzeeQfo62NdjX/E48CSJcjMbcc76T3YO7YXqqGyrsoXGkONWNayDD2NPRB5/y5GdQsKEidTVbv7atcud67xcLlyMoBsA4eiqGIkHMQeUUUe1Aqsp6AYxOKmxVjavJQWQDoYBYkT5XLAn/4E7NlD3VcMFFNBZBImVO6s1gcHpEMh7JF0jHPuWjzodjzHY25yLpa3LEdrtJV1OeQsFCROUi4Db7xht0BMby1Wc4NSQxDphgkCZALjkRDeEzXkOAr6epudmI1LZl2ChlAD61LIByhInEDX7fGPN9+0u7NIXZUTAWRSQJlTpvcXOWAkHMJ7kooiprFZJakYBw6LmhZhTccahKUw63J8j4KEJcuyu69ee83eGJHUlRqTkW7iUOKnGSBnsXgOQ+EQ3hPKUDhqSdaTyItY3rIcq9pWQRIk1uX4FgUJK0eOAK++ak/nJXVlSDzGOwIoiNVd/2HyPI5EA9jDlWDRou26CopBrG5fjd7mXvCc8zft9BoKknobGQG2bwf6+1lX4jsWgHxbCOmIAhO1azmUZRnvhoDhKYy1kOpKBBJYO2stuhu6WZfiKxQk9WIYwOuv27Ox6Eded0pcxlgTpjSQXi2jkRDekhSoNQwtMrHOeCc2z9mMqBxlXYovUJDUw/Aw8Lvf2QdGkboyJB6Z9gByEpttTAxBwMGIjP08baNSb7IgY33neixuWsy6FM+jIKklaoUwVWoMYrRBheGAFkEhGMTOoEazuxjoindh85zNtKCxhihIaoVaIcyYPId0Z5BZK+R8TJ7H3piMQ1yZdSm+IwsyNnRtwMLUQtaleBIFSbWZpj2dl1ohTChxGaPNFjQ4d+X5WDiINyUFGkfXR73NSczBZXMuo7UnVUZBUk0jI3YrhKb01p0FIDsrjEywCDdc0JokYldYwOB0F0GSigWEADbO3oiexh7WpXgGBUm17N0LvPiiPS5C6koPCBiZJUJx4ZtyfyyMt/kirTthYFFqES6bcxmtO6kCCpJKWRbwyivAW2+xrsSXyokARpp0GC4exM6HgtgRUGmaMAOtkVZcPf9q6uqqEAVJJRQFePZZ4Phx1pX4Uq4thPFIyRVdWReiShLeiABpB4/teFVEiuCa+degOdLMuhTXoiCZqbEx4Omn6Yx0Biyew1hXEPkqb3HCmsnzeD8m4wjN6qo7gROwec5mLEgtYF2KK1GQzMTBg8ALL9BZIQwYAQHDswQoHt5+pC8WxttCkXUZvrSidQUumXUJOI4GraaDgmS6duywzwwhdadGZQy1Gq4eD5mqTDiEHVIZBk0RrrvOeCeumncVAmKAdSmuQUEyVYYBPPcccOgQ60p8qZwMYDil1XSzRacpBgP4Y0Cl9SYMxANxfLjnw0gGk6xLcQUKkqnQdeCpp2hQnZFiKoiRpALLE8Pq06PIMv4Y1lH2UYA6RVAM4oYFNyAVTrEuxfEoSC5E04Ann6Rt3xnJt4YwGvXWoPp0aZKEVyMW8qAxuXoLCAHcsPAGNIWbWJfiaBQkk1FV4IkngMFB1pX4UqYjjHSIBp0BQBdE7IxyGOdoenC9yYKM6xdcj5ZIC+tSHIuC5HwUBfjP/7Q3XyR1N94VRlamEDmdyfN4MybSgVkMyIKM63quQ2u0lXUpjkRBMpFyGXj8cWB0lHUlvpTuDCMToBCZiMnzeD0uYIwWLtadxEv4cM+H0R5rZ12K41CQnK1YtEOEtn9ngrqzLswQBLwW42kVPAMiL+La+ddiVnwW61IchXYrO12hAPz2txQijGTbKUSmQjAMrM5ZiFki61J8Rzd1PLnvSRzLHmNdiqNQkJygqvaYSDrNuhJfyreGMB6mEJkq0dCxtgiEIbAuxXcMy8BT+55CX66PdSmOQUEC2IdRPfsstUQYKTTTFN+ZkDQdlxR4BOllXHeGZeCZ/c8gU86wLsUR6AoEgD/8AThGTVUWSg0BjMYpRGZK1jSsL4oQQXtD1ZtiKHhi3xMo67TJJgXJn/4E7N7Nugpf0sISRho1H65Xr66AqmKNGmRdhi9llSye3v80TMvfOw/4O0gOHLAPpSJ1Z0g8htotX+2dVUuJYgkrDDqciYWB/AB+f+j3rMtgyr9BMjRkn69O6s7igJEuCTpt+VFV7bkiuq0Q6zJ8ae/YXuzs38m6DGb8GSS5nL0JI50nwsTY7BDKLjxf3Q16smW0QGZdhi+91vca9o3tY10GE/4LElW1N2Es0QAvC9mOsOdONnQSzrKwImcgYtG0YBZ+f+j3GMz7b28+/wXJCy/QNF9GyskAxmnBYc0JhoE1JcGHL272DMvAU/ufQkEtsC6lrvx1rb37LnD4MOsqfMmQBYykqCuxXoKqilU6Db6zUNbLeOHQC/DT7lP+CZJ0GvjjH1lX4UsWgJFOyRdH5DpJc76IORZNC2ahL9eHtwbfYl1G3fgjSEwTeP55GlxnJNsRRpmjRVssLMypiIL25GJhR98OjBb9sYO4P4Jkxw5gZIR1Fb6kxGVkaFyEGd40cVFJAB37Xn+mZeL5g8/DML3fEvd+kPT1AW/5p4npJKbAYaTZpJXrjIUVBUtMWl/Cwnh5HK8c9/6iZ28HiaLYs7R8NOjlJOOdQVp06BCd+RKaaH0JE+8MvYOjmaOsy6gpbwfJSy/ZZ4yQuisnA7RexEksYFkR1MXFyO8P/97Tmzt6N0j27LH30iJ1Z/EcxlK0h5bTBFQVvRZNCWahqBXx4uEXWZdRM94MklIJ2LaNdRW+lekIQaNjYB2pM1+ikxUZOZQ+hD2je1iXURPeDJJXXrG3QiF1p0YlZAM0S8upONPCCoWChJVXjr0C1fDee5P3rqiBAbtbi9SdBWCshXPcLK1X3tqDnz/8NN7eewRDoxn87LtfxLUbV538+pMv7cTW376It/ccQTpXwOMPfAtLe7rOeIzDfcP4/s8ewWvv7IOq6bh8zVJ85y9vQ3ND/OT3/OPW/8Tzr7yNd/cfhSSKePv/+1Gd/oXTEy2X0R0I4QBHY1j1VtJLeK3vNWzo2sC6lKryVovEsoCXX2ZdhW/l20JQOOfdbRXLKnq7O/G9v/zUeb++ZlkPvvGFWyb+eknBHf/jR+A44KF7vopHfvR1qLqOz3/rfpjmqbEgVddx/ebV+PRNl9fk31FN3XkVActbL3+32DW0C2OlMdZlVJW3WiTvvguM+mMlqdOYIo90xJlbw1+5bhmuXLfsvF+/5er1AICjAxMvWn1t134cGxzF4w98C7GIvR7j3q/fiZX/5SvY9sb72LS6FwDw1c/cDAD4zVPOH58TDANLjTB2itQNWW8WLLx85GXctOgm1qVUjXduSVQVeP111lX4VqY96NnTDlVNAwcOsnTqvisgi+A5Djvece/5E82FIuIeu5d0i/58Pw6Me2dWqXeCZOdOoOzdedpOpgdF5GTv9rdf1NuNcFDGD//XoyiVVRRLCn7ws0dgmCaGxjKsy5s5C1hCA+/MvHr8Vc+c9e6NIMlmgXfeYV2Fb6XbJFiOG2KvnlQyhvu/fRee2/4Wltz0JSz/yF8hWyhh2YLZ4DmOdXkVSZTKaLZoxTsLWSWLXUO7WJdRFd64HXn1VXuHX1J3akxGQfBua+SEzWuW4MVffh9jmTwEgUciGsaaT3wNN13RxLq0ii1WOAzTbvNM7OzfiYWphQiIAdalVMT9LZLhYVrBztB4s/svoeloTESRiIax7Y3dGE3nsGXDStYlVSxcVtBF55YwoRgK3hh4g3UZFXN/i+TNN1lX4FulhqArzhkplMo4dHz45P8f7R/Brn1HkYxFMKu1EelsAceHxjA0mgYAHDg6AABoboyjpTEBAHj4yZfRM7sdqWQMO9/dj+/e/zA+97GrML+r7eTjHh8cQzpXQN/QGEzTxK599kZ9c2c1IxJy9ht1T9HAsTBgubunzpXeHX4Xq9pWISg6+xqZDGe5+TzITAZ4+GHa3ZeRwe4Aypwzp/yebvub7+NTd993zuc/ds2luPfrn8VvntqGr93zr+d8/ct33IivfMaeovnDf3kUjzy9HZlcAZ2tKdx+02Z87mNbwJ02RvLX/+eD+H+e3n7O4/z6//oqLl21qIr/otrYnQjisAtuDLxodftqrO5YzbqMGXN3kLz4IrB7N+sqfEmJyxhodt7iQzJz5YCM34fod8pCUAzivy7/rxB5d3YSubeDu1gE9u5lXYVvZVPuvXTIxIKKinbL3YO+blXWy67e0NG97wbvvAMY3j/C0om0sIQiT10gXtSt0iAJK28NvgW3dhC5M0g0zd4OhTCRbXZn85tcWLRURiMk1mX4UlbJ4mD6IOsyZsSdQfLee7RNPCN6QECBTj70tB5VYF2Cb701+BbrEmbEfbeWpgm8/TbrKk66/4UXcM8zz2Agk8HKzk789LbbsG7ePNZl1UyuJQALtNGflzWUyojKIvLQWZdSUy88/AKe+eUzyIxm0LmgE7d97TbMW8b2tTtUGEJ/rh/tsXamdUyX+1ok+/Y55hz2/71jB776yCP42xtuwM5vfhMrOztx7U9+gqFslnVpNWFxQEF2/nRfUiEL6Da8vW3Kjqd34JF/eAQ3fOEGfPNX30Tnwk785C9/guwY+9funwb/xLqEaXNfkDhoT637nn0WX9i0CXdu3IglHR144PbbEZZl/MKjx/yWUkEYoAkOftBcUsG5c9x3Sp7d+iw2fXQTNt68ER3dHbj9b26HHJSx7TH2r90jmSNIl9Osy5gWdwVJOg2MTHxmRL2puo7XjxzBlt7ek5/jeR5bFi/Gdo9u2ZKPsa6A1Iuo6+iAe1daT0bXdBzZfQS9l5z52l28bjEOvOWM167bpgK7K0gctG5kJJ+HYZpojZ357toaj2Mg4+Ktxc9DDwgo0ZRfX+nSvDkVOJ/OwzRMxBrPfO3GG+PIjDrjtbt/bD/rEqbFXUGyz72HCLldoYkWqvlNvFSm43gZyak5DOQHWJcxZe65SgYHgVyOdRUnNUWjEHgeg2fVNJjNoi2RYFRVbVgA8kGabu03nGVhngd3BY4mo+AFHrmxM1+72bEsEinnvHb3jbnnxtk9QeKgbi0AkEURq2fPxnPvvXfyc6Zp4rndu3FpdzfDyqqv3BCA7vGpoGRibWXv/d5FScTsxbPx3qtnvnZ379iN7hXOee0eGD/gmhMU3REkpunIM0e+umUL/uUPf8C/bt+O9/r78cWHHkJBVXHnhg2sS6uqUswdlwmpvoCqIunBle5bbt+CP/y/f8D2325H/8F+PPT3D0Etqdhwk3Neu2W9jOPZ46zLmBJ3LEg8dsyR57HfunYthvN5fPuxxzCQzWJVZyee/NKX0BqPsy6tqooSdWv52SxDQlrQWJdRVWuvWYv8eB6PPfAYsqNZdC7sxJd++iXEU8567e4b24euRBfrMi7IHdvIP/88DbQzoiQCGGiiRYh+RtvLsyPxEu5YeYfjt5d3dnWAvUHjoUOsq/CtYtxr+y5xMCHB5GSYEGFBgmGJMC0RpiXAtHhYFgcLnD3LAPYf3Af/ZZ9jZYHnLQicAZ7TwXM6BGjgoYK3NAAqvDRxNqioCIcEFGkxat1ppobD6cOY3zifdSmTcn6QHD0K6N4b8HOLouzGO1EOOheGboWhmQHopgxVF6FpPIw6jV0KAiAJFiTJgCQokDgFIleEaBVwMqFcpMuU8T5Pm3WysH98PwVJxY4dY12Bb6lRCTqc3TduQYbCJaEaIWiGBFUToGkc87dqwwAMg0NZFWG/zCIAGsEBkCU7YGRRg8SXIVkZCHDeGODpmlUL73tvJrArHM8eh2mZ4DnnTnpxfpD09bGuwLdKCQlwWJAYXAiqlYBihFFWJCguW31tAVA0Dop2ImBCABogS0AwoCEgFBBAFoLDdliOKGXIQR4q3DEd1Us0U8NIcQQtkRbWpZyXs4Mknwc8upOuG5QC7PvETS6EstWAsh5GSRE928upaoCqSQCSAJIQRSAc0BAQSwhwGQgW4x2vLaDDCuAQR91bLPTl+ihIZoxaI8yYPAeVYzNby+AiKJmNKJTDKPv06FddB7K6BEACEEdAthAJlhDixyBaeSY1NerAIe8tKXGFvlwfVrWtYl3GeVGQkAmpcRkW6hckOhf7IDyCUHwaHpNRVA6KGgYQRkCyEAmVPwiV+m0bFFd1eHBtoisM5AccPU5CQUImVI7WftqvgTAKZjPy5RA0Zw3FOJo9xhICMOu0UBmteUsloGkIWDwUjsZJ6k03dQwVhtAWbWNdyoScGyTZrD1GQphQ5NqMj1gAVK4ZOSWJQslra1Tq71SodCIcNBELpBHEMGo1xbgFEo7WsaVKTunP9VOQTBu1RpixeA4KV931IyYXQNFsRbYYhubRAXPWimUexXIjRLER8XAREX4QvFXdN/2UzuModW8x0Zfrw0XtF7EuY0IUJOQcSqx64yMq14i82oh8UWS+tsMvdB0Yy4YxjnmIRnREpRHIVroqj53QDRonYWSwMOjYcRIKEnIOJVJ5l5OCZqRLjb6ddeUEFoBcQUQObQjIrUiExhHCUEWPGVRViCEOOt0W1J2Tx0mcGSSlElB01oIsP9Hkmb9JKEghXW5CWaEAcRJF5TCkNiIgNyAZGkUQIzN7IAtohIQhuHHrHPcbzA9SkExZOs26Al9ThekPYihIIVNOoaQ4r9lNTlFUDoNqE4KBFJLBEQQwOu3HSJgChujXzES6nGZdwoScGSTj46wr8C2Lw7T211LRgLTSjFKZ3lncpKxwGFCaEQqm0BAchmRN/TUXMzm3HInnORQk00EtEma0iAxrCt0WBhfBmNKBIk3hdbVSmUep3IpwqAkNgYEpLXCM6IZT3zk8j4JkOqhFwowanjwYLAjImZ1I50I03OohxZKAYmkWkrEy4vxRcJOcPRLQdIB2AmZCMRSUtBJCUoh1KWdwZgOVWiTMaPL5v6agGf2FBRinEPGsdC6IvsIClLnzbxAoGAZCFrVEWXFiq8R5QaKqQIHxTqc+pkrnRoTJhTCqLcBAJkWLCX1A14HBdCNGtQUwuYnvfBsc2pnhB04MEuddDdQaYUrnT08KDnmrE+PZCExqgvhOviigWJqDhlgeUe44Tt92JW4J6KMZ3kyMl53X9U9BQk6yABiwg0TnYhgpdtBOvD5nWsBoNoq8vBCp8AAkKwMACJlwYn+GLzixReK8S4EG2pkxAgIsAEWrE/2ZWRQi5CRF5dCfbkfe6oIFIEBNVGYoSKaCTkRkRgkEMaIuwHA2Sl1Z5BwWgNFsBCPqQggGbbjFSl7NQzedNVjpvCApl1lX4EulYCf6hYtoa3dyQcUSj7HxLgSt2axL8a2y7qz3SecFiUJnHdSTBR7j4VUYKi8F9WSRqbI0E0q2F2H9IjjxbcTrFN1Z75POuwIoSOrG4IMYCmxEttj6wf/X5jAr4kUWJMtCMd8CuXQZBIRZF+QriuGs90kKEp9SpUYM8BtRVk69AVCQkOkIcPb1oipBcLlLIaOJcUX+oRrO2n3ZWUFiGPZqKFJTpWAXBo010PUzZ38bk2yLQcjZZOvU9aIbIrTsxQhacxhW5B/UtTUZao3UXDa8FEPlJTDNcwdELI6mapGpE866XiyTQzmzGGFjKaOK/IO6tiZDQVIzFniMhNZhvNh5/u+xKEjI1J1vbkYx14mQtg5Oe3vxEuramgwFSU2YnIShwEYUSg2Tfx/MOlVEvICb5MajVGhAoLQJPCbZBZTMGHVtTYaCpOoMPoAhacMZg+rnQy0SMh38BfaAVpQQxOIG8LTnfNVR19ZkKEiqyhBCGBIvhaJO7YVMYyRkOrgpHCagqgEIhUtpenCVUdfWZEzqWqkWXYhgkF8PVQ1M+e9Qi4RMx1SCBAA0TQZfWA8R0RpX5B8UJJPhnVWOW2liHIPcemiTnVI1AYuOqyLTwE/jctE0CchfAhHx2hXkIzznrPdKh1XjrHLcSBPjGLTWnbNGZCpMi1qEZOqm2iI5QddFWLl1kJCsTUE+QkEyGQqSihhCGENYC8OY2caL1CIh0zGTITXDEGDlVlM3V4UEzlmbqzrrnZuCZMYMPoBBYWYtkRO4864MIGQiM7vx0A0RXGEdzeaqgMBTkJyf4KwfjluYnIhhcT20aQysT8RpzWXibGYF14umSRCLl4Cz6FyTmXDaa9Vh1TirHDewwGM4sH7KU3wn47SLkzibWeHbh6oGEVAugdPehtyAurYmQ0EyLRY4jIbWoVyOVOXxqGuLTIdRhculXI4gpK4DLLr2poO6tiZDXVvTkg6vRKGUqNrjCaCfP5k6o0o3HqViAiH94qo8ll84rffAYdU4qxwnK4S6Tx5IVS3UIiHTYVSxe6VUaELIXFC1x/M66tqaDAXJlKhyE0bLPVV/XN5hlwNxtmqfXlPKdUNGS5Uf1Zuoa2syoRDrChzPEEIYNlfCqkGfMkf91GQajGq/fViAkVtB+3JNgcQ7a7ab84KExknOywKPYXFtRWtFJkNjJGQ6jBrceBiGALG0Bk57a3KaqOysBZ3O+21FqjMDyYvGQxdDUWrXauMt510OxLk0rjYtWEUJIaTR4PtkKEguJOqsH5BTFELdyJVSNX0O0ahNS4d4EM9Dq+GNR6mQosH3SVCQXAi1SM6hi1GMKfNr/jyCRl1bZGossfZ99OX8PEhW9aa3ewXP8QhLzhpHcl6QUIvkDBY4jAoXwTRr/6uiICFTZdQhSCyTA1deBSe+TbEUkSLgatStOFPO+w1RkJwhG14ypWNyq0FQKUjI1OhCfbpBVSWIsLGsLs/lFk7r1gIoSBxNlZuQKXbW7wktQOandxgW8SeVq994WjHfTutLTkNBMhU0RgLA3tF3xFpe9xNCxDq+QRD3Uvk6XicWYBaWgQNdmwAFydRQiwQAkA6unPZRudUg0bbeZApKdV5zpGsSgtqquj6nU1GQTIUs2x8+psjNyJWamDy3aNJdH7mwslX/8bRSIYUA2ur+vE4TC8RYl3AO5wUJAKRqu17CySxwGMNSZs8v1mjVPPEQUazazr/TZRUXw6lvW/WSDCZZl3AOZ/5GfBwk+dAiqBWedFgJqURdW2RyhszuiFxVDSBsLmb2/KwFxSB1bU1ZE5tuHdYMIYy00sW0BkERHLdFNXEWRWR3owMA5XwnBMufk3Kaws58b6QgcZBxeXldFh5eSJBjd8fpNP/+xL/j1j+/FVffdjX+/Bt/jvf2vse6JOYKHNtWq2lykLXlTGtghYJkOpJJ3+0CXA50oFBKsi4DABAw2d5xOsXzLz+P+x+8H5/55GfwL/f8C+bPmY+7/+5ujGfGWZfGVJZxkAD2qYpBaxbrMuqOgmQ6eN53rZIxayHrEk6SVX/Pmjvh4f94GDduuRHXf+h6zO2ai7++668RDATxn8/9J+vSmLEkqaabNU6HUVzou7Pem8PNrEuYkDOuiIm0VvcYWScrhLqhMRxgPxsNuAOapmHP/j1YvWL1yc/xPI/VK1Zj155dDCtjS5edc/icpskImrXfzNQpwlLYkVN/AQoS5izwSGtzWZdxBl7jfb/CPZPLwDANNCQbzvh8Q6IBY+kxRlWxVxad1VrVS3Pg5LexamqNOPc90bm/AZ8EST7UA113XgsgxDnnzpM4Rx4OCxJdRNh0TrdwLbVFnbsY07lBEg4DMWc246rF4gRkNLbTfc8nYDinq42FRCwBgRcwnj5zYH08M47GZCOjqljjkHPgfldKodMX+3C1Rp17c+3cIAGA9nbWFdRULrQIhkNXkgeK/g4SSZKwcP5CvP726yc/Z5omdr61E0sXstt5gCUjFILJaEX7ZAxDQMhYxLqMmhJ50bEztgCnB8ncuawrqBmTk5BVOliXcV5iSYTEO6/LrZ4+edMn8fizj+PJF57EoWOHcN/P70NJKeG6D13HujQmig47le905UIHeId1u1VTZ7wTPOfct2tn3g6f0NlprycxDNaVVF0+tBBG0dlrZSJWBGmkWZfBzIc2fgjpTBq/+LdfYCw9hp55PbjnW/f4tmtr3MELVU2TR9hYhKLwNutSamJuci7rEibFWZZV7yMvpufJJ4EjR1hXUVUWeBwXr3Rst9YJSlzBgDzAugziAJYk4/2ws7uaBcGAGX0BFuetG08OHO5YeQeConOD3LltpRM82L1VCHU7PkQAQM7Ljm5Ok/pRgs7f28owBASsbtZlVF1btM3RIQK4IUhmz2ZdQdVljToen1sBzuQQ5pzbL07qJys4+43sBKPkjtfWdDi9WwtwQ5CEw0CLd85rLgU6HLWK/UJCOq0n8T1ewLjljoFsTZMRtLwVJhQk1eKh7q0cN5d1CdMSzLvjTpTUjh4Mw9kDqWdR5rCuoGoaQ42O3RbldO4IkjneuDA0MY5S2fkXxel4lUeQpzDxs7zkrlZpuRyFZCVYl1EVbmiNAG4JkoYGIB5nXUXFCvI81iXMSFR33olspE54HsNw342EZHhj0J2CpNrmufNN+HQF1bkrUycTzobBOXBFM6k9NRRjdj57JZRSyvVbzEflqKNXs5/OPUGy2N3nNJcDHdBdMOV3IpzOIcI7f/onqb4x0Z2z9gxDQBDuPvhqYco9m1G6J0gSCWCWey+MPOfe2gEgWqbuLb+xpADSLt52hNPc+5rjwKG3qZd1GVPmniABgCVLWFcwIyYnoqQ2XPgbHUzOyhB5d7aoyMwUQu6+eSiXE+Asd+4XNyc5BxHZPb0A7gqSOXPsdSUuUwrOhmm6u7+WA4eY6a4ZZ6QSHIZ5973WTmeZHIJw54zPJc3uuml2V5DwvCvHSvKWc3f5nY5I3j13SKQyeigMxSFns1fCUpx7GNT5JAIJdMbdtajSfVdKby/Auefu3uCDKJe98QYslAWEBHetKSAzk3HBIripKJcjEOCulpXbWiOAG4MkEnHVAsVSwL0DfhOJK+5fz0MuQBQxYrlnG58LkUz3vAZFXsSiJvcd0uW+IAFcNehesppZl1BVgXTA9wdeeV0unHTXligXorljLQYA9DT2QBbcN1POnUHS2emKle4WeJRVb3QRnMCBQ1JLsi6D1IogYMBjOz4rSgxueatzY7cW4Jaf7kSWOv/cbEVuhWm690d8PuF0mKYCe1QhnHTlSvbJWCaHoOXsQ7kAoCXS4pqV7Gdz77tcb6/jpwKXRPfNGJkSC0gaSdZVkGrjBfR7dAcDTnf+URQXt1/MuoQZc2+QiCJwsbN/8CUPdwGFx8MQOGefOU+mpxSJQ/dYa+QE3eELgtuibZidcO8hfu4NEsBeUxJz5hiELsagae4bNJsqzuSQ8MhW3QQAx6Ofd/dK9slomgTRcu646rpZ61iXUBF3BwnPA6tXs65iQmWplXUJNRdJR+hMd49QonGoLn87uBDJcmZXc1e8C21RZ9Y2Ve6/chYssM8rcRgFSdYl1Byv80j64N/pfRwGBGe27KvKoeN6a2etZV1CxdwfJBwHrFnDuopzKIZ3uwlOFx2L0liJy5VjCZQ8sB3Kheiq8yYSdDd0u3am1um8cfXMmwc0OeeXYfIyNNU7K4MnwxkcGgzntQjJFPECjvuhNQJA02TwDlqxz3M81na4vzUCeCVIAGCtc34hiuScUKuHyHgEMu/diQVelo82QvNBa+QEGc7ZaWJhaiESQW9MWPHOFdTVBbQ7Y9GRKqRYl1BfFtCoNLKugkyXJOG4x1axXwhvOuM6FTgBq9udOVFoJrwTJABw6aX2TC7GyoZzpxnWSiAToON4XWYkkvLWnlpTYGjO6MZb3rrcVQdXXQj7d91qamoCli9nXQU03Z9brTdkG8B5dEGb1xjhqKd2+J0qTWXfAksEEq5exT4RbwUJYK8rYbiho8EHYRj+nMUklAWaDuwGHI/jUpJ1FUyYJg/BYtsS2Dxns+f2qvNekIgisHkzs6fXfPoCPSE2FvPci8RrSrEkivDnzQ4AiGA3wN3b1Iv2mDPGcqvJe0ECAB0dzI7k1Xln9MGywpkcmkr+mrXmJpYcwBHO39cob7H590ekCC7pvITJc9ead28d168HjhwBisW6Pq3G1Xch4it7XsHPn/453j7yNoYyQ/jZF3+Ga1dde/LrT+58Eltf3Iq3j7yNdCGNx7/1OJZ2nbkF/+Hhw/j+I9/Ha/teg6qruHzp5fjObd9Bc/zcqZKKpuCjP/wo3jv23oSPBQCBXADJYBJpK131fy+pBIe+cBOsCUbY97z1Cp5++Oc4svdtZEaH8MXv/gyrNp66jna+9CRe/O1WHNnzNgq5NL71wOPo6jnzdz/cdxiP/Oz72PfOa9A1FUvXXI7b/vI7iDecuo4K2TT+7R//Fm/98TlwHIeLL7sOn/yLv0UwVL/uJs6MMLmFvmzOZa48tGoqvNkiAQBZBjZurPvTamZ9B/OKahG9nb343qe+d96vr+lZg2/c8o2Jv64UcceP7gAHDg999SE88vVHoOoqPn//52Ga5jnf//eP/j1akxfeRyw+Gqe1JQ5TiDciZ01876iWi+js7sWn/nLi60gtF9GzbA1u+cLE15FSKuJH/+MOgOPw1Xsewtd/9Ah0XcX93zrzOvq///7L6Du8B3/1f/wS//1//gJ7334Vv7rvbyr/x02Dqdd/wL2nscfVu/teiHdbJIC94n3uXODQobo9pabXdybMlcuuxJXLrjzv129ZfwsA4OjI0Qm//tr+13Bs9Bge/9bjiIXsJv+9d96LlV9ZiW3vb8Om3k0nv/eFd17AS+++hAfuegC/e+d3k9bFmRyaCk3oC/VN819EasEMhnCUO/9d/7J1V2LZuvNfR+uvtq+jkYGJr6P9u17D6OAxfOuBxxGK2NfRnV+/F1/5Lyvx/hvb0Lt6E/oP78OuHb/H39z/GOYuWgEAuPUvvoN//Oad+Phd30SyqT4bnep1fo0GxSA2dG2o63PWm3dbJCds2mS3TurA4gTourvOM1c1FRzHQRZP/YwCYgA8x2PHvh0nPzecHcbf/PJv8A93/gOCcnBKjy0VJDTCGQvAfI3jcSyQAmo4NVvTVHDgIEqnriNRDoDjeOx7x76ODry7E+Fo/GSIAEDv6k3gOB4Hd79Rs9rOpusiuDreQ2/o2oCgOLXXjFt5P0jC4brN4jIE9nPUp+ui7osQlsP44aM/REktoagU8YNHfgDDNDCUGQIAWJaFux+8G7dvvh0r5q64wCOeKTYaQ5D39ovI6TLxxprP0uruvQhyMIxH/9cPoZZLUEpFPPKzH8A0DWTG7OsoMz6MWPLMiRiCICISTyI7NlzT+s4moj5jmfOS89DT2FOX52LJ+0ECAN3ddVmoaPDuW4iYiqVw/13347m3nsOSLy3B8r9ajmwpi2Wzl508a+TBFx5EoVzAf7vuv03/CSwglUvRuSWMGOEI+lH7gexYMoW7vn0/3tr+HL500xL81UeWo1TIYvaCZeAc+LvnrNq/VpPBJC6fe3nNn8cJvD1GcrpLLgGGh4GBgZo9hRuDBAA2L9mMF7//IsbyYxB4AYlwAmu+tgY3Nd0EANi2ext2HtiJhX+x8Iy/d/MPbsZH1n0E991536SPL5ZENIYaMcKP1OzfQCYgiDgiN6Je+6AsWbMZ3//li8hnxsALAsLRBL72iTVousK+jhINzcilz7wGDENHIZtGvLG+mykKqO04icRLuGb+NZ6dpXU2/wQJzwNbtgCPPlqzKcEG5+4tJxqj9njGtt3bMJobxZaVWwAA37ntO7j7I3ef/L7BzCD+7Md/hn/8wj9i1bxVU3rsyFgEaouKrJmtet1kIhwGYs1QGOzsG03Y19HuN7Yhlx7Fyg32ddS95GIU81kc3vM25iy0ewjef2MbLMvEvMUX1bdIM4ha9vZdPvdyJIPJ2j2Bw/gnSAB7vGTLFuC3vwUmmNpaKZNBkBTKBRwaPnTy/4+OHMWuo7uQjCQxq3EW0oU0jo8dx1Da7qc+MHAAANAcb0ZLogUA8PDLD6OnvQepWAo79+/Edx/+Lj531ecwv20+AGBW46wznjMcsMeCZjfPRnvD1FfpJoeT0Jo1lMzSjP+9ZGqyiSakranfDZdLBQwfP3Ty/0f6j+Lovl2IxJJobJ2FQjaNsaHjSI/a19HAUfs6ijc2I9FoX0cvP/kw2mf3IJZMYf+7O/Hw/d/FVR/7HNq67OuofU4Plq69HL+87xu4/a++D0PX8euf/i3WXHFT3WZsncChdi2Fla0r0d3QXbPHdyLOsiZanuRx77wDbNtW9YcdC61Grs6rure/vx2fuu9T53z+Y5d+DPd+9l78Zttv8LV//do5X//yjV/GV276CgDgh4/+EI9sfwSZQgadqU7cvvl2fG7L58BxE8/yOTpyFJd987LzLkicjCmZ6G/oh27q0/p7ZOqUaBIHheltA/L+m9tx393nXkeXXvMxfPbr92LbU7/Bv95z7nV04x1fxk2fsa+jR//lh9j+9CMo5DJItXZi8023Y8vHzryOCtk0fv3Tb3+wIJHHxZd9GLf+9+/UdUEiAITCoyjJr1X9cTtiHbhhwQ3nfe14lT+DBACeew7Yv7+qDzkcWo9iyRsH1dSSFtHQH+qH5btNzGvPDIaxN9BMP9kLCIayKAe2V/Uxo3IUt/Te4vmpvhNx3nSKern8cqChukfEmqa71pCwIhUkNBvOOanOM0QJhwJNFCJTYFX5tSpwAq7uvtqXIQL4OUhEEbjmGiBQvXENy0dHllYqNB5CgqPWW9VwPPqizVDpPJgpqfZrdePsjWiO+PfmyN/vfIkEcN11gFSduxOfdhLOWHIkibALF3E60XiiGVmLWsRTZVnVC9zV7auxuInNbuNO4e8gAYCWFuDaawGh8rmAFv04p8cCmoabEHLp+hunyCaaMWj5s0tlpqwqtdxWtK7A6g7vnL0+U/TOB9jnl2zZUvF579W8y/ELzuTQPNpM26jMUD6RQh+oVTdtVXitLm5ajPWd66tQjPtRkJwwZw5wxRVARdP2KEhmgjM4tIy1IMC7e0FnvZXijThWpz2jvMassBu6p7EHl82+rDrFeAAFyel6eio6w4RaJDPH6Rxaxlsg8dTPPxXlWBKHfX7SYUUqGGyfk5iDK+Ze4bu1IpOhIDnbkiXAunUz+quWSRdWJXiNR2umlc58vwA1msAhnma8VWZmr9VZsVnY0r2FNiE9C/00JrJqlf0xXZQjFRMUAW3ZNogchclEtEgcB6a5ap2cayY9W62RVlzbcy0EvrZb8rsRBcn5rFsHrJje2RscR/N/q0EoC2jNU8vkbHokhgNiA+iOpXLcNKOkKdyE6xZcR9fkeVCQTGb9evtjijiu+htB+pVYEtGWaaNz3z+gxJLYJzbSqvUq4fmpv1a74l24aeFNvtkSfiYoSC5kxQrgqqumtM6EgqS6BEVA21ib79eZ5OMpHKQxkaqa6mt1cdNiXNtzLSSBJoFMhoJkKubPB66//oJnv0/nLodMDadzaB5pRpT34zRXDulEC45xfvy319ZUuqHXdKzB5jmbaWB9CugnNFXt7cBHPgJEzr/dNbVIaoMzOaSGU0j46a6c4zGcbMMA/N0aqxWOM877NZ7jccXcK3Bx+8V1rMjdKEimo6EB+OhHgcbGCb/MgYKkZiwgOZREIyb+2XuKIKA/0YbRaRxMRabnfDd9Ei/hwz0fxsLUwgm/TiZGQTJdkQhw8832tipn4Se5yyHVERuJodlsBufRmUuWJONorB0Z2oCxpjj+3NdqWArj5kU3ozPeyaAid6MgmQlZtsdMFp5518KDTv2rh/BYGO2lds+tgtfDMewLt6Fg0TqFmjvrpq8x1IiPLv4oUuEUo4LcjSZFzxTP23tztbbax/YaBgROZV2Vb0gFCe1KO0YbR1EwC6zLqRCHXCKF46jvcbN+xvHKyf9emFqITbM30RqRCtBPrlK9vUBzM/DssxC0MutqfIXTOaSGUgg2BTGKUdblzIwooT/SjAy81bpyOotTIPIiNnZtxKKmRazLcT3/ntlebaqK4st7MLyXNtJjQY2pGAoOwbDcM05lhCI4LKfoVEMGWlr6sLlnERpDPpi8UQc0RlItsozyymU4GGqERbuC1p2ck9GeaUdIcMd02WK8EXspRJgI6VFsbL+EQqSKKEiqKBoF9pRieFVsh3KBxYuk+gRVQMtQC1JIOXdWlyRhKNmOI1wMtGdWffHgEcw0o3Q4hViU3vqqiX6aVSTL9kdak/Ci2ob+cAL0ZlFnFhAdiaKj0OG4rVXKsQbsDbdjjNaH1F3QDIE71o7ySBiiCATpQM6qosH2KovFgNFRwASHt4pJHJXCWM6PIaQoF/7LpGrEkojmUjOKjUWMCWMwLXaLRS05gIFQigbUGRAgQMo0ojxy6jjiGA1jVh21SKrs7It0XJPxktKKw6FGWBWeCU+mhwOHyFgEHdkORHgWU2s5FOMp7Am1UYgwENJisA53nBEiAAVJLVCLpMoSE2wHZYHD7lIMR4UQVgbHECuX6l+YjwmKgKahJkQaIhgVR+sys8sMhNAXakTeopdYvUmQwI80opSZuP8qHq9zQT5AV3mVNTWd/2sFQ8Q2owVzgkXM18ch6bQSvp5C4yF0SB3INmSRNbOwanG6hygiG2lAH0KAReNj9cSDR7AUR7E/PunPfrLXKJkZCpIqa26+8PccLodxFCEsDOXQqWYhGO5Z++B2vMYjOZRELBhDJp5BzsxV6YF5FKMNOM5FYNAEizrjENaiKPcnUNQuvL0MBUn1UZBUWTxuz9xSL7BbigkOu0txHOCj6A1l0FrOgaO1oXUjlAU0lhsRi8SQjqZRNIozfCQOSiyB43yc1oQwEDIi0AYTKJamNgYlivYm3qS6KEhqoKkJ6Oub2veqJo8/lRoQEWJYImfQWMrXtjhyBqkgobnQDCWuYDw4DsWc+uw6PRJDn5hAEbTJYr0FrCCskSRK2cC0/l5TE0DrhauPgqQGmpunHiQnFAwRO0opJKU4FohZNJYKAJ3QXTeBbACt2VaUG8oYl8ahmdp5v9cIRTAUSNBW7wwEzSCs8QSU9MwWgkyl65lMHwVJDVRysaY1CTu0FMJCEosCWTSX8+BMOjCrHjhwCI2HEEQQSkJBJpBB2Syf/KoWiWFIiiFniZTxdRYyIjBG4ijnK1vMSUFSGxQkNVCNwbyiIeCNYgNkPoEFoRza1RwNytcJBw7BTNAOlLiOozEDfSEJJYunAKkjDhyCahTaSBylUnXeqmigvTYoSGogHgcCAaAai9lVk8euUgK7uTi6QwW0G3mEVFolX2uaJKFPimJ/Lgoty0MMaQg15aHIeZh0pHJNSZAglSIoD0dRmsIsrKmSZSCZrNrDkdNQkNRIczNw7Fj1Hs+wOOwtRbEXUTRIKuaKBaTUArVSqsjiOKQDYRxHBMfLIeC0YRK9JEE/2gCOTyDUVIQVLaDM0fkz1cKBQ1APw0hHoWaCOP8I1cxRa6R2KEhqpKmpukFyunFNxrgmg0cSs0NFdFp5RMr0pjZThUAQA3wEh8thaOXJt7GxTB6loSgwFIUQ0CGnCtBDBWg1eevzPtkKQChGoIxEUNJru4UQjY/UDgVJjcyaBbz5Zm2fwwSHQ6UIDiGCiKCjSy6hySoiUlZAnfmTUyUJQ1IEh9UI8srMXgaGIqLUlwCQgBxTISYLUOQCDFArcTKyFYBYDkFLh6EW6zfzrb29bk/lOxQkNdLePrWFidVSMETsLsUAxBDgDXQGSmixSogpJVroCLvbqhAIYpQL4bgWQk4TUc1GhJqToeZkAA2QoyrERAlGoASFo/EsgEPADIAvhqGmw1AVAXV6WZwkivbNHakNCpIa4XmgsxM4cKD+z62YAvaXotiPKETOxKxgGU1cGTGjjIDqny4YXRSQkUIYskLoU4LQL9BtVS1qXoaalwEkwEsGAskyEClBEUq+GagXLQmSHgCKQSjpEJQad1tdyKxZgEDrRmuGgqSG5sxhEySn0y0eh8thHIa9lXaQN9AqK0jxCuJ6GYF6NZnqQJFl5IUA0pAxrAeQ0SSA8b6YpiagNBwBhu1t7KWICjGqAkEFuqh4ZmxFhgxBDcAqBqFmA9A1gfWP/gxz5rCuwNsoSGqoq8vejsFJPUtlUzgjWGTeRLOsIMFriFoqwoYGWdMc3x2miSIUUUKWD2DUkDGsBqCpzj/vRSvI0AoygCgAgJcMSFEVQkSBKakweB0adDh1jIsDB8mSIRgSOFWCUZag5QJQGbc4LmT2bNYVeBsFSQ0Fg0BrKzAwwLqS81NNHsfLIRzHqWNpOVhISDqSooo4pyFs6ZBNHZKuQ6zjdGOT56EKIkqChBIvIWeJyOoSMroEQ+eYtzaqwdQEKOMhYPy0Y4E5C1JIhxDSwAc0WJIGQ9BhcgYMGLXZ/v40HDiIEMGbAnhTBKeLMMoSjKIEvSTVfXyjUs3NQDh84e8jM0dBUmOzZzs7SCZigUNak5DWzp1Rw8NCWDQQ5g2EeANBzoDImRBg2R+WBQEm+A/+5Cz7aAjT4mBxHCzOfnzTsgfADY6HCgGKxaNsCSibAkoGj5IhwDQ5wERVB8VdweKgFSVo55nRxIsmBNkALxngJBOcaIATTICzAO6DmPngvwELJzcltjhwJv/BL4QDLA6WyQMmB1MTYKoCDFWAqfOe+pFTt1btUZDU2Jw5wKuvsq6iekxwyOsi8nTpMGPqPEydB+j43imhIKk9Z3dsekBDA50RTQgr0SiQSrGuwvsoSOqA7ogIYYMG2euDgqQOurtZV0CIP82bx7oCf6AgqYO2Njrek5B6i8dpNXu9UJDUSW8v6woI8ZfFi1lX4B8UJHWyYAFt0UBIvfA8sGgR6yr8g4KkTgIBGishpF7mzQNCoQt/H6kOCpI6ou4tQuqDXmv1RUFSRzToTkjtJRJARwfrKvyFgqTO6E6JkNqi11j9UZDU2cKF9iE7hJDqEwT7NUbqi4KkzmSZBt0JqZV58+xdt0l9UZAwsHw56woI8aZly1hX4E8UJAykUrR1AyHVNns20NLCugp/oiBhZPVq+/REQkh1rFnDugL/oiBhpLGRxkoIqZa5c4GmJtZV+BcFCUPUKiGkchxHrRHWKEgYSibtPbgIITPX3W238Ak7FCSMXXyxvcEcIWT6qDXiDPQWxlg8TguoCJmpBQvsLVEIWxQkDkCtEkKmj+ftcUbCHr19OUA0SvsDETJdixYBsRjrKghAQeIYa9bQ+QmETFUwCKxdy7oKcgIFiUMEAsCll7KughB3WL+e9tRyEgoSB+npAbq6WFdBiLPNmkUTVJyGgsRhNm2ibeYJOR9RBC67jHUV5GwUJA4Ti9G8eELO5+KL7SnzxFkoSBxo+XLaN4iQszU2AitWsK6CTISCxIE4Dti8mfbhIuSEE68JWm/lTPRrcaimJjoAi5ATli6ls0acjILEwdasoQVXhESjtGbE6ShIHEwUgauuouY88S+eBz70IUCSWFdCJkNvUQ7X0kILFYl/rVsHtLWxroJcCAWJCyxdai9WJMRP5s2jWVpuQUHiEpddZh+ERYgfJBLA5ZezroJMFQWJS0gScPXVtOqdeJ8o2te6LLOuhEwVBYmLNDTYc+kJ8bJNm+joXLehIHGZnh5gyRLWVRBSG4sX04aMbkRB4kIbNtDiLOI9TU3Axo2sqyAzQUHiQjwPbNkCRCKsKyGkOkIhe1xEEFhXQmaCgsSlolHg+uvtA7EIcTNZtq9l2sXBvTjLsizWRZCZGxoCHn8c0DTWlXjPCy/cj2eeuQeZzAA6O1fittt+innz1rEuy1NE0Q4RWnTobtQicbmWFuCaa2gblWrbseN/45FHvoobbvhbfPObO9HZuRI/+cm1yGaHWJfmGSe6aClE3I/efjxg1ix7PyLadr56nn32Pmza9AVs3HgnOjqW4PbbH4Ash7Ft2y9Yl+YJHAdccQUwezbrSkg1UJB4RHc3HUFaLbqu4siR19Hbu+Xk53iex+LFW3DgwHaGlXnHxo207Y+XUJB4yOLF9iZ3pDL5/AhM00As1nrG5+PxVmQyA4yq8o41a2gtlNdQkHjMqlW00R1xruXL7XPXibdQkHjQ+vX2jsFkZqLRJvC8gFxu8IzPZ7ODSCRoZHimenvpSASvoiDxqI0b6c5vpkRRxuzZq/Hee8+d/Jxpmti9+zl0d9M74UysWkVjeF5Ge8l62Jo1QDAIbNvGuhL32bLlq3jwwc9g7tw1mDt3HZ577kdQ1QI2bLiTdWmus349dbd6HQWJxy1bZq9+//3vAdNkXY17rF17K/L5YTz22LeRzQ6gs3MVvvSlJxGPt174LxMA9hTfzZuBRYtYV0JqjVa2+8TRo8Czz9IKeFIfoghcdRUwZw7rSkg9UJD4yMgI8OSTQLHIuhLiZeEw8OEP27v5En+gIPGZfN4Ok7Ex1pUQL2poAK67zt5UlPgHBYkPqSrw3HN2dxch1TJrFh2R61cUJD725pvAa6/RIDypDMcBq1cDF11E+735FQWJzw0MAM8/b3d5ETJd4bA9qN7ezroSwhIFCYGiAL/7HXD4MOtKiJt0dQFXXmmvVSL+RkFCTnrrLeDVV6mri0yO54G1a4GVK1lXQpyCgoScYWjIHojP5VhXQpwoGrW7slppXSY5DQUJOYeq2l1dhw6xroQ4ydy5wOWX2zslEHI6ChJyXvv2AX/8Iy1g9Ltg0N4va+FC1pUQp6IgIZNSVWDHDuDddwG6UvyF404dlkatEDIZChIyJSMjwEsvAcPDrCsh9dDUBGzaBLS0sK6EuAEFCZkyywLee8+e2aWqrKshtSDL9oysJUtocSGZOgoSMm2lEvDKK8CePawrIdW0YIE9FhIKsa6EuA0FCZmx/n5g+3a724u4V2MjsGED0NHBuhLiVhQkpGKHDwM7d9L4idukUvZxzPPmsa6EuB0FCamao0eB11+3FzUS52putgOEDp0i1UJBQqru2DG7hTIwwLoScrrWVjtAurpYV0K8hoKE1Exfnx0ofX2sK/G39nY7QGbNYl0J8SoKElJzAwP2gsaDBwHDYF2NP/C8vaXJ0qW0xTupPQoSUjeKYm+78v77NNOrVlIpYNEioKeHtncn9UNBQpgYHbUDZe9eO2DIzAUCdnAsWmSvSCek3ihICFOGYU8f3r0bOH6c9vOaKo6zxzwWLbK7sASBdUXEzyhIiGMUCnaoHD1qh4qus67IWUTRHu/o6rLDIxplXREhNgoS4kiGYQ/SHz1qf4yPs66IjWTSDo6uLjtEqOVBnIiChLhCPm+vTzlyxJ5O7NVNI2XZ3qrkRHhQq4O4AQUJcR3TtAfrR0ft2V+jo8DYGKBprCubHlG0Z1mlUvZ+V01N9gfPs66MkOmhICGekc2eCpYTH4UC66ps0agdFieCI5UC4nHaqp14AwUJ8TRFsbvFikV7+/uJ/iwWZ95VFgjY266Hw2f+efp/x2J0wiDxNgoSQmAP7pfL9p+WZXefnfgTsLubOM7+4Hm7WyoYpG4oQgAKEkIIIRWi+ylCCCEVoSAhhBBSEQoSQgghFaEgIYQQUhEKEkIIIRWhICGEEFIRChJCCCEVoSAhhBBSEQoSQgghFaEgIYQQUhEKEkIIIRWhICGEEFIRChJCzmP//v2466670N3djWAwiHg8jo0bN+LHP/4xSqUS6/IIcQyRdQGEONHjjz+OT3ziEwgEAvizP/szLFu2DKqq4g9/+AO+9rWvYdeuXfj5z3/OukxCHIG2kSfkLAcPHsSKFSvQ2dmJ559/Hu3t7Wd8fd++fXj88cfx5S9/mVGFhDgLBQkhZ/niF7+IBx54AC+//DI2bNjAuhxCHI+ChJCzdHZ2IhAIYP/+/axLIcQVaLCdkNNks1kcP34cy5cvZ10KIa5BQULIabLZLAAgFosxroQQ96AgIeQ08XgcAJDL5RhXQoh70BgJIWeZNWsWQqEQ9u3bx7oUQlyBWiSEnOXGG2/E/v37sX37dtalEOIKFCSEnOXrX/86IpEIPv/5z2NwcPCcr+/fvx8//vGPGVRGiDPRynZCzjJ//nw89NBDuPXWW9Hb23vGyvZt27bhN7/5DT772c+yLpMQx6AxEkLOY+/evbjnnnvwzDPPoK+vD4FAACtWrMBtt92GL3zhCwgEAqxLJMQRKEgIIYRUhMZICCGEVISChBBCSEUoSAghhFSEgoQQQkhFKEgIIYRUhIKEEEJIRShICCGEVISChBBCSEUoSAghhFSEgoQQQkhFKEgIIYRUhIKEEEJIRf5/u7WnJ2QGSiUAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "venn3([\n",
    "    set(train_1['smiles'].tolist()),\n",
    "    set(train_2['smiles'].tolist()),\n",
    "    set(train_3['smiles'].tolist()),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_1.to_csv('../../data/hi/drd2/train_1.csv')\n",
    "train_2.to_csv('../../data/hi/drd2/train_2.csv')\n",
    "train_3.to_csv('../../data/hi/drd2/train_3.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_1.to_csv('../../data/hi/drd2/test_1.csv')\n",
    "test_2.to_csv('../../data/hi/drd2/test_2.csv')\n",
    "test_3.to_csv('../../data/hi/drd2/test_3.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "lohi_benchmark",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
