{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "WARNING: You need at least 120GB of RAM to execute the code for the full dataset\n"
     ]
    }
   ],
   "source": [
    "from IPython.lib.deepreload import reload\n",
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "\n",
    "import os\n",
    "from tqdm import tqdm\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from joblib import Parallel, delayed\n",
    "from ogb.utils.url import download_url, extract_zip\n",
    "from matplotlib import pyplot as plt\n",
    "import tarfile\n",
    "from rdkit.Chem.AllChem import GetAdjacencyMatrix, RemoveHs\n",
    "\n",
    "from molecules.physics import get_self_euclidean_dist_matrix\n",
    "from molecules.parse_sdf import sdf_to_mols\n",
    "from molecules.parse_cxsmiles import get_contact_dict, cxsmiles_to_mol_with_contact, try_read_cxsmiles\n",
    "\n",
    "# WARNING: You need at least 120GB of RAM to read this file and execute the code\n",
    "print(\"WARNING: You need at least 120GB of RAM to execute the code for the full dataset\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "WARNING:root:The OGB package is out of date. Your version is 1.3.1, while the latest version is 1.3.3.\n"
     ]
    }
   ],
   "source": [
    "ROOT = \".\"\n",
    "SDF_URL = \"http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2-train.sdf.tar.gz\"\n",
    "SDF_LOCAL = f\"{ROOT}/pcqm4m-v2-train.sdf\"\n",
    "SDF_LOCAL_ZIP = f\"{SDF_LOCAL}.tar.gz\"\n",
    "RAW_URL = \"http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip\"\n",
    "RAW_CSV = f\"{ROOT}/pcqm4m-v2/raw/data.csv.gz\"\n",
    "SKIP_DOWNLOAD = False # Set to false for downloading and unzipping the file. If already downloaded, set to True\n",
    "OUT_PATH = \"pcqm4m-contact.tsv.gz\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "ANGSTROM_DIST_TH = 3.5\n",
    "PATH_LEN_TH = 5\n",
    "MAX_MOLS = None"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Using exist file pcqm4m-v2-train.sdf.tar.gz\n",
      "Using existing file ./pcqm4m-v2-train.sdf\n"
     ]
    }
   ],
   "source": [
    "if not SKIP_DOWNLOAD:\n",
    "    # This can take many minutes\n",
    "    path = download_url(SDF_URL, ROOT)\n",
    "    if os.path.exists(SDF_LOCAL):\n",
    "        print(f\"Using existing file {SDF_LOCAL}\")\n",
    "    else:\n",
    "        with tarfile.open(path) as file:\n",
    "            file.extractall()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Using exist file pcqm4m-v2.zip\n",
      "Extracting ./pcqm4m-v2.zip\n"
     ]
    }
   ],
   "source": [
    "if not SKIP_DOWNLOAD:\n",
    "    raw_path = download_url(RAW_URL, ROOT)\n",
    "    extract_zip(raw_path, ROOT)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  4%|▍         | 148362/3378606 [00:30<10:30, 5124.56it/s]RDKit WARNING: [00:00:50] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 57%|█████▋    | 1921223/3378606 [08:49<06:19, 3842.38it/s]RDKit WARNING: [00:09:08] Conflicting single bond directions around double bond at index 12.\n",
      "RDKit WARNING: [00:09:08]   BondStereo set to STEREONONE and single bond directions set to NONE.\n",
      " 58%|█████▊    | 1960724/3378606 [08:59<05:25, 4358.73it/s]RDKit WARNING: [00:09:18] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 75%|███████▌  | 2550203/3378606 [11:46<03:45, 3678.85it/s]RDKit WARNING: [00:12:06] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 77%|███████▋  | 2597414/3378606 [11:59<03:22, 3857.10it/s]RDKit WARNING: [00:12:18] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 82%|████████▏ | 2778597/3378606 [12:47<02:42, 3682.53it/s]RDKit WARNING: [00:13:06] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 82%|████████▏ | 2786749/3378606 [12:49<02:27, 4009.88it/s]RDKit WARNING: [00:13:08] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 83%|████████▎ | 2821130/3378606 [12:57<02:15, 4111.82it/s]RDKit WARNING: [00:13:16] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 85%|████████▍ | 2860733/3378606 [13:05<01:36, 5346.46it/s]RDKit WARNING: [00:13:24] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 85%|████████▌ | 2888199/3378606 [13:10<01:28, 5518.46it/s]RDKit WARNING: [00:13:29] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 87%|████████▋ | 2934567/3378606 [13:19<01:58, 3738.33it/s]RDKit WARNING: [00:13:39] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 88%|████████▊ | 2980779/3378606 [13:32<01:33, 4238.94it/s]RDKit WARNING: [00:13:51] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      " 89%|████████▊ | 2990830/3378606 [13:35<01:57, 3308.45it/s]RDKit WARNING: [00:13:54] Warning: molecule is tagged as 3D, but all Z coords are zero\n",
      "100%|██████████| 3378606/3378606 [14:52<00:00, 3786.99it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "3378606\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAIAAADCEh9HAAAABmJLR0QA/wD/AP+gvaeTAAAbz0lEQVR4nO3daVgUV9oG4Ldpmk1EQcCgqAiiCAEDiIiSmIQQF8BEBUUTktGARvxijEZAEyXqTAJxGRw1ZlTccEUMgwqoTRC3kWEVF8JiRAUUEZFGtga6z/ejYg9DlB26gef+VVV96vDWdXk9ntpO8RhjBAAAbaUk7wIAALo3xCgAQLsgRgEA2gUxCgDQLohRAIB2QYxC8x49elRaWsotSySSrKws+dYDoFAQo9C8kJCQEydOcMtlZWUuLi7yrQdAoSBGAQDaRVneBUD3kJOTk5CQQETl5eXyrgVAsSBGoUVu374tEAiIqKamRt61ACgWxCi0yIwZMxYtWkRET58+PX36tLzLAVAguDYKbZGenv7bb7/JuwoAhYAYheaZmZkNHTqUW1ZRUbG1tZ08efJbb72VkpIi38IAFAEPMzxBa4nF4rlz50ZGRvbp0ycyMtLZ2VneFQHIE0aj0GqqqqonTpyYP39+ZWWlm5tbRESEvCsCkCfEKLQFn88PDQ396quvxGKxp6dnaGiovCsCkBvEKDTl7t2733zzjWx1zZo1ubm53DKPx9uyZUtQUJBEIvHx8dm0aZOcagSQM8QoNEUkEl27dk22mpiYWFZW1rCBv7//9u3beTzeypUrAwICurxAAPlDjEJ7LVmyJCwsTCAQBAcHL168WCqVtnzf4mJ6Mbql2lpqyzNUV6/SO+/QhAk0YQIdOdL6/QHaC4/fQzPS0tImTpzILd++ffulbebNm9e3b985c+b8/PPPT58+DQwMtLCwaEnnx46Rnx9lZNCoUfT4MXl5UeueoXr0iD7+mM6do5Ej6elTeu89GjyYJk1qTRcA7YXRKDTDxsbm8gt2dnZPnjzZuXOnWCxu1Iy7Za+pqRkREWFpaenm5paYmNiS/t95h778sq3FRUTQrFk0ciQR0YABtHw5HTzY1r4A2ggxCs1TeoGIDh486OvrO2zYsODg4KqqqobNDAwMKioqdHR01NTUzpw54+Dg8N5778XHx7+0z+fPnxcUFBDRpEmkqUnHjrWpssJCGjLkv6vDhlFBQZs6Amg7xCi0ztixY8eMGfP48eOAgAATE5MtW7ZUVlZyP929e5eIJk6ceP/+/cDAQG1t7V9//dXJycna2vrgwYMSiaRhP5mZmXFxcdzyli20Zg1xU0c9eEAVFS2u5rXXqKjov6uPHpGBQfuOD6D1GMCrVVVV5eTkyFZzc3MrKysZY0KhcNy4cdw/IV1d3cDAwLKysh9//JGIli1bFhYWtmnTpkePHi1btkxXV5drZmFhceDAgbq6uob9b93KfviBMcaCgti8eczWlrm4MC0ttnAhy8pqQX137jATE/bkCWOM1dSwt99mp0934OEDtARiFNpOKBSOHz+eS8kBAwaMHTuWiLZs2WJkZEREmpqaampqGhoafn5+I0aM4JoZGRmFhIRUVVVxPchiVCxmFhbMxoZNmsSIGBHj89mMGSwh4dV//rvv2KVLLDycWVqyqVOZldUffQF0LcQotNf58+fffPNNLiV5PF5wcPDly5ddXV1lZzx8Pv+nn346cODA6NGjuS36+vqBgYHPnj2LiWE//cQyMphYzC5fZv7+jDGWmso++YSpqv6Rp2+8wQ4dKqmpqfmfv5qSwng81qcPe/SIJSay0lImlcrl8AEQo9AxLly48Pbbb6uoqGhoaJw9e5Yx1ihMJ0yYkJmZeerUKdnVAC0traVLl3p7PydiGzc27vDxYxYUxAwNGRF7882F+vr6/v7++fn53K+XfH2lWlrMz4/94x+MiC1f3sXHCyCDGIUOU19f7+PjQ0QqKionTpzgNmZkZFhZWRER0WAe7/9cXV2Tk5PPnj076cXTnXy+so6OrVB4/aV91tSwAwekEyY4co1VVFS8vLz27dtHRJaGhhUFBZIRIxgRi4rqwgMF+B+IUehIUqn066+/5k7k9+zZI9seGLiNz68kYkSreTyeq6trUlJSamqqh4eHiopK//79p0+f3ujuUyMXL16cNWsWn8+XDW/nzJmzefPmkTo6qV5eOKMHOUKMQscLCgrirpNu3rxZtvHgQaaszIiYispOIt62bdu47TExMf369SMiT0/PppOUMVZYWBgYGKijo0NELi4umpqaRBQTE9OJBwPQHMQodIqQkBAej0dEGzfukm08fpypqDAiZmeXWllZJduekpKira1NRB4eHs0mKWPs+fPn3377rZKSEp/P//DDDzvlAABaDDEKnSUsLMzEZLSeXtH//d9/z7ljYpi6Olu6tHHjlJQUbozp7u7ekiRljPn7+xORoaFhSUlJhxYO0DqIUehEJ0+KueGntzerr/9j42+/vfxKZmpqaquStK6uzsHBgYhmzpzZoVUDtA6+xQSdKz6ePviAKiroww/p2DFSVW2qcVpamrOzc2lpqbu7+9GjR5WVm5mB7MGDB9bW1qWlpTt37vz88887sm6AFkOMQqdLSqKpU6m0lKZOpZMnSV29qcYNk/TIkSMCgaDpziMiIjw8PNTU1BITE8eMGdORdQO0DKYmgU43bhzFxZG+PsXG0uTJJBI11djGxkYoFOro6ERERMybN6+urq7pzt3d3b29vWtqaubNm9doximAroHRKHSRrCxydqbKSvr0U7KwIG9vIqJff6XiYpo7t3HjVo1Ja2pq7O3tb9y44ePjs2vXrk47AoCXw2gUuoiZGV2+TLGxlJtLa9bQ778TEd29S7duvaRxwzHp3Llzmx6TqqmpHTlyRF1dfffu3UePHu2c8gFeCTEKXcfIiOztiYi++oqWLGmmsY2NTVxcnI6OzsmTJ5tNUgsLC+7TpIsXL87Ly+uwigFaADEKcvD++6SuTsePN9PM2tq65Unq6+s7Z84ckUg0Z86cZq+oAnQgxCjIx9attHYtcRPnnz9PL2bQb6xhknJvizbR588//zxs2LDk5OTAwMC2VZWamtrwssA333xTU1PTtq6g90CMgnwMHUrz59M//kEiEbm5kZERBQfTSyPL2tpaKBQOGDDgl19+aTpJ+/fvf+jQIWVl5eDgYKFQ2IaqcnNzL168KFsNCwurra1tQz/QqyBGQW6WLyc1NRKL6Y03qKSEAgLIzIz276f//WgTMcYCAwNnzpypra39yy+/zJ49u7q6+lV9Ojo6rl27ViqVenl5FTX8TFMLBAcHY+wJbSHfl6igF8rNZZWVfywXFrKCAiaVsn/9i73++h/T3ZuZsX/9q0j64o3RkJAQItLX1z979qxAIDAxMTExMUl49ddFJBKJk5MTEU2ZMkXamgn0pkyZsmzZMhMTk9kvaGhoiESidhwr9AqIUVAUEgkLD2empozHk1pYjHv99dfDw8MzMzPV1dWJKCoqaunSpUSkqqpKRHw+f8WKFbJvOjVSUFDAfUpv06ZNTfxFkUgUFxcnW925c6ejo+NHH31074VBgwYhRqFZiFFQLLW17MCBvMGDB3NnSw4ODtOnT/f29hYKhTweTyAQXLt2LSgoSEVFhYiMjY1fNSyNiYmRtX/V3yoqKtLW1haLxdxqYWFhnz59fHx8ZA2GDBmCGIVmIUZBEVVVVW3atEn2cWYnJ6fXXnuNiL7//nuuQUZGhrW1NRHxeLyFCxdWVFT8uRNu9GpiYtIwCquqqoqLi2Wr48ePFwqFstURI0a4urrKVhGj0BKIUVBcFRUVQUFB/fv3JyI1NTVjY+N62XR7jNXW1jYcll64cKHR7jU1NVzUzp49W7YxODjY19dXthoSErJr138nlv73v/+dlJQkWxUKhS2c/BR6M8QoKLqSkpIlS5Zwk+b97W9/a/RrRkaGjY2NbFj6/Pnzhr9mZ2draGhoaGjk5uZyW/Ly8sLDw7uodOgdEKPQPYSFhXFJ6u/v3+j+e8Nh6fDhw+Pj4xv+OnDgQB6Pt3r16q6tF3oRPDcK3cPHH398+PBhgUDAnZVLpVLZTwKBwN/fPzk52cbGJi8vz8nJadGiRRUVFUSUk5PDXQk1NzeXX+3Q08k7xwFaITo6mnv+ad68ebW1tY1+raurazQsXbx4Mffv/P79+3IpGHoDzDcK3cylS5fc3NzKy8vd3NzCw8PV1NQaNUhPT58/f35GRoaSkpKSklJ9fX3//v2fPXsml2qhN8BJPXQzb7311q+//qqrq3v69Olp06ZxJ+8NWVtbp6SkBAUF8fl8DQ0NbsucOXPkUSz0ChiNQreUmZnp7Oz88OHDcePGxcbGcp8UbeQ///mPs7Pz8+fPzc3NL168KHsKFaBjYTQK3ZK5uXlCQsLQoUPz8/MXL14sevGBp3Pnzu3Zs4dbtre3t7e3J6LMzMzNmze3sOdbt275+PjIVhcsWJCVldWhtUNPgxiF7srU1PTy5ctCoTA9PV0sFnMb8/PzG6be3bt3iUhFRSUoKGjr1q0t6ba6uvrevXuy1Xv37jUxoRQAIUahWxs6dKiFhcWrfi0vL8/Ly1NTUwsNDeXxeMuXL4+IiOjK8qCXUJZ3AQAdwMXFhXs4v7i4eMaMGdzG9PR0xpilpeXHH39cUFCwatWqjz76SFtbm5tGrwnJyckODg7ccmZmZqdWDj0AYhR6gujoaH19fSLas2eP7KT++vXrRPTGG28QUUBAQFFR0datW2fNmnXp0iUrK6smerOzs5NNnv/uu+92bunQ/eGkHnqshjFKRFu2bHF3dxeJRNOmTXvw4IFcS4MeBTEKPVajGFVSUgoLC3vzzTcLCwu9vb1fuktaWlrD10wBWgLPjUK3l5WVNWLECO7aaGlpqVgsNjAwqK2t7du3b319vUgk0tTUlDV+9uzZggULPDw8KioqFi5cyG38y1/+smvXrqSkJGdn52nTpoWGhnKz8xFRRUWFuro6n8/v+uOC7gKjUej2zMzMuAwlIh0dHQMDAyK6fft2bW2tqalpwwwlIm1t7cjISIlEcvPmTdnG8+fP5+bmzpw5s6amRldXV5ahRKSpqYkMhaYhRqFnanRG3zSpVDpjxownT564uLjs2LGjk0uDngZ36qFnajZGT548mZ6eTkRSqbS4uPjx48e2trbHjx+XDWwBWgijUeiZmo3RmTNnXrx4MSEhwcjIiDE2bNiwM2fO9OnTpwtrhB4C//FCD8QYy8jIoCZjlMfj8fn8r7/++ujRozweLyIigvtqHkBrYTQKPVBaWppIJNLQ0IiMjLx27VplZeVLm+3evXvz5s0CgUBbW7uJl0oBmoYHnqCnqaqqcnJyys3Nffr0qWyjgYGB7Qvjxo0TCASnT5/29vaWSCT79u2zsbF5/fXXeTyeHMuG7gsxCj2KRCLx8PCIjIw0MDD4/PPP7927d/369Vu3btXV1TVsNnjw4JKSErFYvG7durVr18qrWugZEKPQczDGfHx8QkNDdXV1L1++bGZmxm2vr6/Pzs5OTU1NTU3NzMxMS0srLS0dNmyYra1tREQEBqHQTohR6DlWr179ww8/aGhoCIXCCRMmvKqZVCq1sLDIysq6cuXKxIkTu7JC6JEQo9BD7Ny509fXVyAQREVFTZ069c8NampqPDw8xo0bt2LFin79+jHGRCIRnnCC9sOdeugJoqKivvjiCx6P989//pPLULFYvHHjxoaXRNPT08+cOXPixIm0tLT6+npLS0tkKHQIxCh0ewkJCZ6enhKJJDg4eP78+UQklUo//fRTPz8/2eQjRJSUlERE48aNky3Iq2DoYRCj0L3dvHlzxowZNTU1vr6+K1eu5DauWLHi+PHjWlpaS5culbVMTk4mIjs7O9mCXAqGngcxCt1YXl7e5MmTy8rKPD09t23bxm384YcfQkJCVFRUIiIirK2tZY25QaidnR1Go9CxcIsJuquSkhJHR8fs7Ox33nknNjZWVVWViA4dOvTJJ5/weLxjx455eHjIGpeVleno6Kiqqubl5Q0aNEhdXV0kEmEWEugQ+GcE3VJVVdX06dOzs7OtrKwiIyO5DI2Ojp4/fz5j7O9//3vDDCWipKQkxpiNjU1aWhpjzNbWFhkKHQUn9aAo7t+/f+vWLdlqTEzMq1rW1dW5u7tfu3bN2Nj43Llz/fr1I6KkpKQ5c+bU19d/++23X375ZaNdcH8JOg9iFBRFXFzc/v37ZateXl4v/SwSY2zhwoWxsbF6enqxsbHctEx37txxc3OrrKz08vJav379n/fC/SXoPIhR6Gb8/Pz279/ft2/f2NjYkSNHEtHDhw+dnZ2Li4tdXV337t370pc7ZemZkpJCGI1Ch8LlIVAgt27d2rt3L7csFouvXLmirKw8atSoAQMGcBt37NixadMmgUBw4sQJW1tbIiovL3dxcbl37569vf2xY8deesUzPz//0aNHOjo6fD6/uLhYT09v+PDhXXZQ0OMhRkGBMMYkEolsdc2aNZcuXSIiXV1dMzMzNTW1+Ph4JSWlAwcOTJ48mYhqamrc3NyuX79ubm4eExPzqreSZI86cWNSDEWhYyFGQYFYWlr6+PhwywEBAVZWVlVVVdnZ2SUlJVeuXCGiQYMGLVu2bO7cuVwbf3//S5cuGRoanj17VkdH51XdFhcX9+nTZ+zYsbgwCp0B10ZBcW3dujU5Obm8vLygoODw4cNEJBaLZa8qEdHq1audnJzOnj07ZMiQJvpZvHixSCQKCAiQDUs7u3LoVRCjoCjMzc0bTlvn7e0tu1k0ePBgFRUV+tP5+MCBA+Pi4lry/Q8+n6+urp6WlkZEY8eOlW1ftmwZF9BEVFhY2MIPMgM0hJN6UBQODg4NV4ODgxuupqam0v8mYGslJCRUVlZqampu377d1NR05MiRI0aMkEqlsseqGl2ZBWghxCh0D1yMcnfn26C8vHz58uW6urolJSUbNmyQbZ8+fbqlpWV5eTkRVVRUdEip0NsgRqEbYIxx5+Nti9G6urrZs2ffuHHDyMho3bp1RUVFuS/069dv27ZtERERRCQWizu4bugdEKPQDeTl5T19+nTgwIGGhoat3ZcxtmjRonPnzunp6QmFwhEjRjT8denSpStXrvTy8iKigoKCl06bD9A03GKCboB79ahtd9i/++67ffv2aWhonDp1qlGGAnQIxCh0A22+MLp3797169fz+fwjR46MHz/+zw20tLTU1dW5ZT6fr6ur285SoRfCfKPQDTg5OcXHx586dcrNza3le8XHx0+dOrW2tnb79u1LlizpvPKgl0OMgqJjjOno6JSVlT18+NDAwKCFe926dcvR0VEkEn3zzTd//etfO7VC6OUQo6DocnNzR44cOWjQoMLCwhbuUlhY6ODgkJ+f7+npeeTIkZfO+QTQUXBtFBRdax+8Ly8vnzZtWn5+/qRJk/bv348Mhc6GGAVF16r7S3V1dbNmzbpx44a5ubns4yIAnQoxCoqOe9rJ1ta22QtQjLHPPvssLi5u0KBBsbGx2traXVIg9HZ4/B4UGmMsPT2dW+jXr5+VlZWtra2tra2jo6OxsXGjxqtWrQoLC+vbt290dPTQoUPlUS/0RohRUGg5OTkikWjIkCEPHz58/vz51atXr169yv00ePBgOzu71atXc4/l7969Ozg4WCAQREREYKIm6EqIUVBo3Oz3enp6jo6OBQUFaWlpqampqampiYmJhYWFhYWFfn5+RBQdHe3r68vj8Xbt2vX+++/Lu2roXfDAEyiuJ0+e2Nvb19fX5+fnE5GmpuaYMWO4k3obGxtlZeXk5GQPD4/bt29PmjSpsrJy/fr1a9askXfV0OsgRkFBiUSit99++/r168bGxlZWVmlpaQ8ePGjYYODAgXZ2dqampmFhYSUlJQsWLAgNDZVXtdCbIUZBEVVXV0+ZMuXSpUumpqaXL18eOHAgEZWVlaWkpFy5ciU1NTUpKam4uJhrrK+vb25ufu7cOW6GfIAuhhgFhVNXVzdjxozo6GhDQ8MrV64MGzbspc1+//335OTkBQsWVFdXZ2VljRo1qovrBODgFhMoFsbYwoULo6OjdXV1z58//6oMJSITExNVVdXq6uoBAwYgQ0GO8Pg9KJbly5fv379fS0srNjZ29OjRTTfOyMggIjzeBPKFGAUFsnbt2pCQEBUVlYiIiJa8RH/9+nUiGjNmTOeXBvBKiFFQFDt27NiwYQM3xbKzs3NLduFGo4hRkC/EKCiEyMjIL774gsfjhYaGzpo1q4V7IUZBESBGQT62bt16584dbjknJyc3N3fChAkbN2789NNPW9hDVVXV77//LhAImr2ECtCpcKce5EMoFI4dO5b7xlxRUdHVq1cvXLggEAha3sPNmzclEomFhQUeFwX5wmgUFEWrMpRwRg8KA6NRkJtVq1bp6OgQ0dOnT7mFVkGMgoJAjILc+Pn5cXPcJSYm7t27t7W7I0ZBQSBGQW60tbW5l+XbME09Y+zmzZtEZGVl1fGVAbQGro1Ct5SXl1deXm5gYKCvr09EoaGh0dHR8i4KeimMRkE+NmzYMHz4cG7Z0tLyu+++a9Xu3PtLstdAc3Nz6+vrO7RAgJZCjIJ8WFtby5a1tbVbe16PC6OgOHBSD90SF6MnT550cHBwcHAICwuTd0XQe2E0Ct0SF6NRUVHcK0wBAQHyrgh6L4xGofspLy+/f/8+j8czNTWVdy0AiFHoburr63fu3MkYU1JSUlbG6RTIHz4iAt3G7du3w8LCDhw4UFRUpKurW1VVlZWVNWTIECJ68uSJQCDo37+/vGuE3ggxCoouPz//8OHDhw4dun37NrfFzMyMiLKysqytra9cuaKhoSHXAqG3Q4yCPEkkEiUlJR6PR0SMMalUyufzuZ+qq6vPnDlz8ODBs2fPcs+Eamtre3h4eHl5TZw48dmzZ/b29nfu3HF3dw8PD+d6AJAPBiA/Tk5OycnJ3PL58+c9PDwkEolQKPTy8tLU1OT+iaqqqrq6uoaHh9fW1jbcNzMzU0tLi4h+/PFHedQO8AdcoQcFIhaLBw8eXFRURERKSkqTJk3y8vJyd3fv16/fnxuPHj364MGDM2fODAgIMDc3d3Fx6fJ6AYhwpx7k7tmzZ8XFxcXFxWVlZaqqqvr6+mZmZoGBgTk5OQkJCZ999tlLM5TzwQcfrF27ViqVzps3LzMzsyvLBpDBtVGQp/fee6+uro67w/7kyRNDQ8OffvpJV1e35T0wxjw9PcPDw0eNGpWYmIib9dD1MBoFOdu8eXNUVFRUVNS6deuIqFUZSkTcV/AsLS2zs7M9PT0lEknnlAnwSohR6PY0NTVPnTqlp6d37ty5NWvWyLsc6HUQoyBPAwcOVFVV5ZbV1dX19PTa1o+RkdGxY8eUlZWvXr1aV1fXcQUCNA/XRqHniI+PNzAwCAsL+/7777ktq1at8vb2NjExkW9h0LNhNAo9x7vvvltVVZWUlCTbkpSUJBKJ5FgS9AaIUQCAdsHj99DTpKSkODg4cMt4mBS6AGIUepqxY8fGxcVxy05OTvItBnoDnNQDALQLYhQAoF3wwBP0KNXV1Y8ePTI2NuZW7969a2BgoK6uLt+qoGdDjAIAtAtO6gEA2gUxCgDQLohRAIB2QYwCALQLYhQAoF3+H2x+Ckz2JN34AAACXnpUWHRyZGtpdFBLTCByZGtpdCAyMDIxLjAzLjIAAHice79v7T0GIOABYkYGCJADYgUgbmBkA9MsbA4aQIqZeFphAYhmJKiOQQVkLRIfQrND+MzsCitANBMjB0SCiRFMMzLSiuZmEGJgFGVg4sxgYhYHeiCDiYULiJkSWCUZWHkzmNhYE9h5GDi4M5g4GRM4GRi4mBO4eRO42Rl4ZFmYePgYeLgYeAUU+AQ1mPjZMpj4ORIE+BSEGRhEGBjEmBgkWBik2Bik2RlkOBhEmNkYOYGGM7OxsvFzcPOysXPzCvDxiDPCokFu6d75DhXcKw5YpDc4/I457CC01PHAOvdEh3OrJjrYzq488OXvF/uIU6ccXH593R/wR8dh/tkZDkbPjA6oPem29/1s5hB9eY79tpYn+zu+GAPF4+z95dwO1NrvdOg/FLp/Q1HEfhu/qQ5u2z7vE7ngcMDj4TIHf4fGA8tfeDj8WbnV4dOlp/uz9uyxTzSa7SBZHL7vlvSZ/W/09zoEefLun/hWxl61tMphXpyl/QKp/P3HvRc6OH5Utmd53mP/6VKuA8/klTZLdfIPHNlY58DP3WvPlbHILqB3pYPPskn29uHcDgqXljosvLbgwHrVRQ6eelsdFJIPAdXmAe2sdej+u/mAsXE1kL7scLLM7cAOuX4HL54yBzObqQf+tp+xX9D5wEH59sT9KWccHZZXtjt8aNU9oLtJ1u5aGAfQ/Z/t725ds5/9HKPDhAUL7O9Nzj8QVnvOIVXy1P74GUv2S7KscYg4NWl/hlLCgTjvew6HL2fv69XwtRcDALF2x6dRi6LQAAAC13pUWHRNT0wgcmRraXQgMjAyMS4wMy4yAAB4nJVW224UMQx936/ID5C1HTtOHqGLhIQol4fyiNpSCQRVgbYS8PU4iWcY0FZVRqPdnEl8xjm+TPZnN1/vr69u92/uL04+XV2/PTmc350/O7+9en/z48v+2/3FpT39fkmA+tFmLmxm//PX7z349aH9VLv2EO35LrTr3eHl57uwXumw24UEIVEI0G9cBn6bfTgjY+r2HGvFaoMnEkmQxzNAyuEk/Gd59O4sOSIINpYUgUS7J1HsLTMsHEXIWSpAGwWMFXmKJceUlBqL2RJ2XygqUJ3zRXXsyGyrpOEL1DkWikVKHrZE4l5pMb45FsTSRhCLgrrOVaZiJPbeCs3WWJIsIxY5xpIe1CVnKcOWNYP7gqRzvhAODyzXUsWRL5gqzbFkVXBNq+2j68zKR3f0cKQL1zp2RAg8+KTypLoVR+6CZXGvKItWxrTNXXqMxfIeEw9bJXa+muYqQCIwiHvAfUemCwKUGZYUFXt8jQVoyTpNiuF0hqVqzYsHiy4JrUKPsBwRaMmXWjy+yOI1jWosr2d0wbL0OqBMrlW2Hb2Yyro8WHIE5exake1ygsV0yaN6jI/YO2Ylq4oJlrzYWmRMXRj5zEoy50thllGNOSePlljgZljUukAuo3qskmUwA5UpdTlS6h60vouYRr6g8JQulhsJvGfbl8RrOnFNcyzmPXn3Fq5eAWwVOhUjFnJdxFrwGFGRKXUlJu0drqnLQ2f7wgJNqZujtTX1XucK2TcAcGJHGFr24wAUiFaQQstAHoAD8TrDvbR9RgLiBrRPjYMc7Nix2OTQTiM+ow0voISWF76sBlyp2+v/Abgs8zf6DG2om3VZl6V2dmogd4CymcG/bBzaucKB7aeM1mUgd195BXUFumGjrW+EW5C6IA6kC+RAO7WDsvHaziRhCckrOxE+PXR32oL2349A1Gaenx52fwBQFbAlH7LgzwAAAcZ6VFh0U01JTEVTIHJka2l0IDIwMjEuMDMuMgAAeJxdkr1qXDEQhV8l5RquxfyPxkvAsI2rJEVIs2zALO5srwku/fA5o02RpLmDPh0dnRnd48PpeDjxWc6748Pp5vVa/nzl+OV02H3+enM83N+f+Ar5H8nusOr6/IUZ308fuxjmMrdbHp6zusr02vtYKxpTfRVz3xtKLSpMts6UBXCEz8aWsd3qIJaEg6Z7i9hiNnYS3utIjo0GCWXD1OS9jMk8QWdeKZUHKMmUDYncamlNrbU+o6m4tH1OV1BWUtCiazK1UlxWrAbfFOMOWDAAzGoDJi7sKacgLRk5VmE433s0AaWm98o8N1yRS1ksy8x9nQ/WfQwMItdkOgYaITZII3NFLG8bS+shZjrOS9NOTCUFKqqxKHMbsBuge1+l3RV3c9zxpxnm2lPXbsPRTkflBUmLN8U0SnC+ChFvselsm/XDBKQ8r5QkZEMJPAGyRtMYlBZwSKnoWUW0NMQSsMTRK5OvVCTe0AVsCcAwVFxkuYSquZ6ohHt+Seg0kSLWD4eMvrXL5JvtJ9+hQ94e3y8v335d3u54vFyev1/efzw+P72en4be8f9IPn4Dn1isShuZbd4AAAAASUVORK5CYII=",
      "text/plain": [
       "<rdkit.Chem.rdchem.Mol at 0x7f3f816ead60>"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "mols = sdf_to_mols(SDF_LOCAL, max_mols=MAX_MOLS, removeHs=False)\n",
    "print(len(mols))\n",
    "mols[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 3378606/3378606 [12:09<00:00, 4630.24it/s]\n"
     ]
    }
   ],
   "source": [
    "all_contact_dict = Parallel(n_jobs=-1)(delayed(get_contact_dict)(\n",
    "    mol, angstrom_dist_threshold=ANGSTROM_DIST_TH, path_len_threshold=PATH_LEN_TH\n",
    "    ) for mol in tqdm(mols))\n",
    "\n",
    "# these_mols = mols[150000:]\n",
    "# all_contact_dict = []\n",
    "# for mol in tqdm(these_mols):\n",
    "#     all_contact_dict.append(get_contact_dict(\n",
    "#         mol, angstrom_dist_threshold=ANGSTROM_DIST_TH, path_len_threshold=PATH_LEN_TH\n",
    "#     ))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "def validate_contact_maps(all_contact_dict, idx):\n",
    "    # Validate visually that, when reading the cxsmiles, the contact map gives the right information\n",
    "    contact_dict = all_contact_dict[idx]\n",
    "    cxsmiles = contact_dict[\"cxsmiles\"]\n",
    "    mol, contact_idx = cxsmiles_to_mol_with_contact(cxsmiles)\n",
    "    xyz = mol.GetConformer(0).GetPositions()\n",
    "    dist_matrix = get_self_euclidean_dist_matrix(xyz[:, 0], xyz[:, 1], xyz[:, 2])\n",
    "    dist_matrix[np.tril_indices_from(dist_matrix)] = float(\"nan\")\n",
    "    plt.imshow(dist_matrix)\n",
    "    adj = GetAdjacencyMatrix(mol).astype(float)\n",
    "    adj_4 = (np.linalg.matrix_power(adj, 4) + np.linalg.matrix_power(adj, 3) + np.linalg.matrix_power(adj, 2) + adj) > 0\n",
    "    adj[contact_idx[:, 0], contact_idx[:, 1]] = 2\n",
    "    adj[np.tril_indices_from(dist_matrix)] = float(\"nan\")\n",
    "    dist_matrix_inv = (dist_matrix ** -2)\n",
    "    dist_matrix_inv[adj_4] = 0\n",
    "\n",
    "    plt.subplot(1, 2, 1)\n",
    "    plt.imshow(adj, vmin=0, vmax=2)\n",
    "    plt.subplot(1, 2, 2)\n",
    "    plt.imshow(dist_matrix_inv, vmin=0, vmax=ANGSTROM_DIST_TH**-2)\n",
    "    plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXAAAAC5CAYAAAAxiWT3AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAVRklEQVR4nO3df2yd1XkH8O9zr69/JCE/nMSpCQEbSCo6VIywQqCVBqWMjH9oNW0q0qYgIaXTxgYbnQitVuC/IBUQU9dKqYrIprYbU9slmtAyK2qHWGnAoSGEhiQmJODEjU2o88O/7fvsD78Gn3Pe6/v6ve9973vs70eK7PPm3Pc+Nk8Or8/xOY+oKoiIyD+5WgdARETxcAAnIvIUB3AiIk9xACci8hQHcCIiT3EAJyLyVEUDuIhsFZFjItIjIjuSCoqo1pjb5AOJ+3vgIpIHcBzA3QB6AbwB4H5V/W1y4RGlj7lNvqir4LWbAfSo6kkAEJF/A3AfgJJJvmbNGm1ra/uk/Xb/OadPw4dDFYRUG5s+P2y0jx9eEqsPVWYUQxjXMUngVvPO7Xpp0EYsTeCtyxvbkMz75EfNdt2A+2/PztuhkAe+pWJ+y5PK7YnPuF9nsd5s54edLshPmDHKlBuz5suniVwwbz52tft1NXwQEoDlMzeOGO1hrXf6DI43Ge2pojk5MtE/iMmLw07QlQzg6wF8OKvdC+DWuV7Q1taG7u7uT9rtzz/j9Ln+735dQUi1sW/fIaN9z5UdsfpQZQ7o/qRuNe/cbsRS3Cp3JfX+c+r5xhajrWFjkdiDmNtp+QlzkGj53q+cPnbeHhwbd/rc0mAOSEnl9pkHbneuDW+YMtrNv3FngZeeM/vUX5hw+oyvKBhtKbqDfMPLbxjt49/a7PTZ9JevO9dsj+55x2i/NXq102dP701G+/dD5oB+6h92hd67kjnwsLRxvgsisl1EukWke2BgoIK3I0rNvHN7AmMphEVkquQJvBfAhlntqwCctTup6i4AuwCgs7PT+Efw/sOPOjdth/lU7sMTeZQnDrtPz3NbnD4+fK2LxLxze7k0p3ao0PWPlM+Tpv9dZ7Qn1X1We2+wvex9avmT4vqn3Z8IbH1/7z6lF0bMrzU3kXf6jC8v/+zaYLWjPG2Heeb6PzDa7/24w+kzNWINxUXzGaI4GR5vJU/gbwDYKCLtIlIP4GsA9lZwP6KsYG6TF2I/gavqpIg8BGAfgDyAF1T1nTIvI8o85jb5opIpFKjqywBeTigWosxgbpMPuBOTiMhTFT2BV4O9sGkvaobxcfHPx5jJHyN/6O6xsF2NvhQiie/kztuca7lJs93826LTp+GC+WuEhcuTTp9iwXx2VXed09H/kLtg2vLd8gutvY+br1t6wO1TN2qugRet31MfcH8FHACfwImIvMUBnIjIUxzAiYg8lbk5cFvYZp+7c3+ayL33nT0079ekubEhLD5uwacofMztPztpHkVQPDXq9EFvo9mnzp0bnmw0n0vrCu5z6lSj+bqpgnufvqfNOfgVPeX3ah1/odO51vxr83WFIfc+OXPaHlPmTn+IO9U//bqyERERUSZxACci8hQHcCIiT3EAJyLyVOYXMcN0Ff/DaMc9VzzOok2apwhywZLiynru/PmpO5xrx//9s0Z77e/dlTu7OMPSPvd88vyouXEndzmsj3mGuUrIYmiTWcCh6fyU08eWG3SH1Lx10rDm3PfKj5hfa84uSsFFTCKihYUDOBGRpziAExF5qqI5cBE5BeASgCkAk6rq/hZ7CqJU9gkTZ+6ah1AtDlnJ7YXigyfMA52Ov+3WqWztNyd6C8PuxG9+zLxWFzK/LeOTVtt9r9yIOQ+tuZDamn3mfeovuvc5/6C52Wf1YacLlp0xY5SQ/UD5UXN+3Z4nz02ET4InsYh5p6p+lMB9iLKGuU2ZxikUIiJPVTqAK4D/EZGDIrI9rAOr0pOn5pXbrEpPtVDpFMoXVPWsiLQA6BKRd1X1ldkd5qpKT5Rh88rtNKvSE82otCbm2eBjv4j8HMBmAK/M/ap02AubSZ1gSIvDfHN70y3Xoqv70w1miznfPtruVtJZ0WMuwjX1u0PPkn7zp5jcmLtxxl7Myw2F/OQzab4ubBETam2UCdnIU29tyskPuwumS8+ZG4IQUjinbsitCGTLWZuPnLmRYvjzQewpFBFZKiJXzHwO4I8AHIl7P6KsYG6TLyp5Al8H4OfB/7nqAPxYVf87kaiIaou5TV6IPYCr6kkANyUYC1EmMLfJF14eZhWHfQAWEH4IVjncyEM0t0vtYVfNyeGmGwbd1w2tNNr5cXfet2HQnN+uD5lzlilrnnzYLTlfXNpgtLXOnU2eWFHvXLONrbSq/4y6MatVYd4+kAsAYPVx4gmZowf4e+BERN7iAE5E5CkO4EREnuIATkTkqUWziBmGm32oWsIWze38itKn1nr+9WajnS+4m2umfmdWrtF8yMl51hpcyxWXnS7nl6w07xNSuaau0bxWrHcXKHOT1oJg3u1jLxIWC26fKeu96kbc593JJmuBMuRL14KzK8fto2XiCV/D5BM4EZGvOIATEXmKAzgRkacW9Ry4zYc5SaJUnTc3vEjrsNNFV1mHPF0suPdZZh7W9DdX73e6fLvwgNGeDCldoxdKTAbP7mNvegl5TNV8rmwfsc+gCtmAY/cJ23wk9gFck+4cuL25JwdrraHEWZd8Aici8hQHcCIiT3EAJyLyVNkBXEReEJF+ETky61qziHSJyIng46rqhkmUPOY2+S7KIuaLAL4L4F9mXdsBYL+q7hSRHUH7seTDqz17YZOLmgvKi1jEuR1F3SVro8qV7mpa/alGo33F6ZDFRzFP9tvR84DTp6XHrJyTC1k0rLtk9slfcivySNFcJJRRt5KOWAuJYacR2hWBciEVeZadtar2jLsLlHWXrdcVQxYx7XhyZjwStyJPUAfwY+vyfQB2B5/vBvCVcvchyhrmNvku7hz4OlXtA4DgY0tyIRHVFHObvFH1RUwR2S4i3SLSPTAwUO23I0oNc5tqLe5GnnMi0qqqfSLSCqC/VEdV3QVgFwB0dnaW+HV0f7Cyz4IXK7eXS7POd33Eh/WUtn98LZH7nH7qdqNdbHCHgvEV5gFO9Rfcg7PGVpsbixrVvU9uxKpCPxlymFXI4VW2i+3mIV0NFxqcPn23m0PoxAp3frv5sPm6Ysio2/ix+XXYc95TveHxxn0C3wtgW/D5NgB7Yt6HKGuY2+SNKL9G+BMArwH4rIj0isiDAHYCuFtETgC4O2gTeYW5Tb4rO4WiqveX+Ku7Eo6FKFXMbfIdd2ISEXmKpxEmgJV9aNMt16Kr+9MF7lrnQNhiezlJxXzh5euda7n/M9v5sZBTBXXuhTwAKNZb1XZCqvY47NMJI5pqMF831eg+704sNxctV14z6PQZ6VtttCebQhZex+0qQlbloRJrrnwCJyLyFAdwIiJPcQAnIvIU58CrgJV9aDG79Kp7+sCys+a872Sj0wWN580NOHUj7kaeuiGznb8YcpjV+MSc7aiW9ZqHUNUN2yV6gDVvmpt9Jt5d7fRZfcZ8XbHOnZNvGLTubU2T58diHmZFRETZxAGciMhTHMCJiDzFAZyIyFNcxEwJK/vQYtFy5xnn2pnuK4122Il89ZcLRrth0N29UiyYC4Ahe2KQGzZfl8u7z6nFJWaFIAmp/nN5vdmnMSSej2+0Tg1cFbJgmjPvE7YpZ3yZGWPdqHlfDVn4BPgETkTkLQ7gRESeiluV/kkROSMih4I/91Y3TKLkMbfJd3Gr0gPAc6r6ncQjWiSiVPZZKFV7ep7bYrQz9HW9iIRy+/jBk6mta8Q5qCrN9wr7PrTjdBLhRPLeztuM9vKTbp9LbeXv0/7N8tWIrkup3EdOh8Kvl3thicrdRN5jbpPvKpkDf0hEDgc/hq5KLCKi2mNukxfiDuDfB3AdgA4AfQBKVvVl5W7yTKzcnoB7JgdRtcUawFX1nKpOqWoRwA8AbJ6j7y5V7VTVzrVr18aNkygVcXO7ALdiOVG1xdrIIyKtqtoXNL8K4Mhc/Skau7JPe+mHv09kaEGwJB9inJG13M76gmUWXbvDXHz84Mnb3T5byi+qhp//V7mz33DjGVlnVSOy3nzs+fB/Q2UH8KBy9x0A1ohIL4AnANwhIh2Y/hpPAfh62aiJMoa5Tb6LW5X+h1WIhShVzG3yHXdiEhF5iodZZZg9Jw7wEKyFZKHMOWfNiX+61WivPOrOZh97v9W8EDLhvQnmoVz2hjQg2vrO7x4257yX9hWdPvWXrMOq7Io8o+H35hM4EZGnOIATEXmKAzgRkac4gBMReYqLmJ6xF77sEwzD+LSRhqhSG//2QNk+cfaEx/13NLzeXJGsG3Wr61xsN9t2j2KJjb58Aici8hQHcCIiT3EAJyLyFOfAPVfNzT77zh4q2+eeKzsSeS/fbbrlWnR1f7o+EfbfgBt3auPp99058Y6G8qdHxsnt00+5B1WtOGHOgS/pn3L6iF2q3trIkytxWjGfwImIPMUBnIjIUxzAiYg8VXYAF5ENIvILETkqIu+IyMPB9WYR6RKRE8FH1g4krzC3yXdRFjEnATyqqm+KyBUADopIF4AHAOxX1Z0isgPADgCPVS9UiirKZp8omxKiLOLYJ7R5tmmIub0IPNZ+a/lOCbnmiV+V7RNWIWjjnSeNdlHNrTzvvTIeeq+yT+Cq2qeqbwafXwJwFMB6APcB2B102w3gK+XuRZQlzG3y3bzmwEWkDcDNAA4AWDdTOzD42FLiNaxKT5nH3CYfRR7ARWQZgJ8CeERVL0Z9HavSU9Yxt8lXkTbyiEgB0wn+I1X9WXD53EwFbxFpBdBfrSCpMmGbfeyK93Hnrj2b83ZUK7e5aYdm9DxrrhOtfNct//P2sQ1z3mN0tBB6PcpvoQimC70eVdVnZ/3VXgDbgs+3AdhT7l5EWcLcJt9FeQL/AoC/APC2iBwKrn0TwE4AL4nIgwA+AMBijeQb5jZ5rewArqqvwj2edsZdyYZDlB7mNvmOOzGJiDzF0wgXKXth017UjMr3RUxKXtgCrn06Y5Q+Pvpo+23OtTWHzPaS/kmnjxTnHooHhsJ/UOQTOBGRpziAExF5igM4EZGnOAdOAKpb2YcozsamrM2T9/3nDc41fdU8qHL5abfaTs66lB91+xSG8s612aQYfp1P4EREnuIATkTkKQ7gRESe4gBOROQpLmJSSfYiEhc1aTGbmnKfd8dbzJMFmwbcPoVhcwVSc+6mHLXWMHMTZlvcAwyn+4VfJiKirOMATkTkqUqq0j8pImdE5FDw597qh0uUHOY2+a6SqvQA8Jyqfqd64VGWZG1jRQKY25QJ9px30SrAoyUOPY5yHngfgJkCr5dEZKZyN5HXmNvku0qq0gPAQyJyWEReEJFVpV9JlG3MbfJRJVXpvw/gOgAdmH6KCT1QWkS2i0i3iHQPDAxUHjFRwpjb5KtIA3hY5W5VPaeqU6paBPADAJvDXququ1S1U1U7165dm1TcRIlgbpPPys6Bl6rcLSKtwRwiAHwVwJHqhEhZZi9stj9fvrJPVqr4JJnbxw+enPeCbpwT+nyQ1MJ21hbIr/qTd6p27yvK/H1eh0KvV1KV/n4R6QCgAE4B+HqEexFlCXObvFZJVfqXkw+HKD3MbfIdd2ISEXmKh1lRoqpZ2Wff2UNz/v3me4YTeZ84Nt1yLbq6P53TDvuaF+qcdxxpbgqL+32vVjzfO/2qc+26wrI5X1Mqt/kETkTkKQ7gRESe4gBOROQpDuBERJ7iIiZVXZTNPlE299xzZcecf39cz88rriRF2cgTZ1FsoS58Zm2TTpr+6povzvs1pXKbT+BERJ7iAE5E5CkO4EREnuIcOKUubLNPu3Via1YOvKqmhTq/nZS4m30W0/eVT+BERJ7iAE5E5KkoVekbReR1EXkrqNz9VHC9WUS6RORE8JFlp8grzG3yXZQn8DEAX1LVmzBdYmqriGwBsAPAflXdCGB/0CbyCXObvBblPHAFcDloFoI/CuA+AHcE13cD+CWAxxKPkBYFe2HTXtSMYuyZ+S18JpnbPI1wfpL6Xiz272nUmpj5oGJJP4AuVT0AYN1M2angY0vVoiSqEuY2+SzSAB4UeO0AcBWAzSJyY9Q3YOVuyjLmNvlsXr+FoqqDmP5xciuAcyLSCkwXgcX0E0zYa1i5mzKPuU0+ilKVfi2ACVUdFJEmAF8G8DSAvQC2AdgZfNxTzUBpcYlT2ed8icrdpVQztxf73KxtIcx5p1lFKKooOzFbAewWkTymn9hfUtX/EpHXALwkIg8C+ADA4j1ejHzF3CavRfktlMMAbg65fh7AXdUIiigNzG3yHXdiEhF5igM4EZGneBohecNeRKr1AhJRrfEJnIjIUxzAiYg8xQGciMhTnAMnb9lz4iJysEahENUEn8CJiDzFAZyIyFMcwImIPMUBnIjIUzJdlCSlNxMZAHAawBoAH6X2xslgzNVXabzXqGpNznVlbqfKt3iBKuV2qgP4J28q0q2qnam/cQUYc/X5Fm8YH78G32L2LV6gejFzCoWIyFMcwImIPFWrAXxXjd63Eoy5+nyLN4yPX4NvMfsWL1ClmGsyB05ERJXjFAoRkadSH8BFZKuIHBORHhHZkfb7RyEiL4hIv4gcmXWtWUS6RORE8HFVLWOcTUQ2iMgvROSoiLwjIg8H17Mcc6OIvC4ibwUxPxVcz2zMc2FeV4dvuZ12Xqc6gAfFY/8ZwB8D+ByA+0Xkc2nGENGLALZa13YA2K+qGwHsD9pZMQngUVW9AcAWAH8dfF+zHPMYgC+p6k0AOgBsFZEtyHbMoZjXVeVbbqeb16qa2h8AtwHYN6v9OIDH04xhHrG2ATgyq30MQGvweSuAY7WOcY7Y9wC425eYASwB8CaAW32J2YqfeZ1e/N7kdhp5nfYUynoAH85q9wbXfLBOVfsAIPjYUuN4QolIG6YrrR9AxmMWkbyIHALQD6BLVTMfcwnM6xT4kttp5nXaA7iEXOOvwSRERJYB+CmAR1T1Yq3jKUdVp1S1A8BVADaLyI01Diku5nWV+ZTbaeZ12gN4L4ANs9pXATibcgxxnRORVgAIPvbXOB6DiBQwneA/UtWfBZczHfMMVR0E8EtMz896EbOFeV1FvuZ2Gnmd9gD+BoCNItIuIvUAvgZgb8oxxLUXwLbg822YnovLBBERAD8EcFRVn531V1mOea2IrAw+bwLwZQDvIsMxz4F5XSW+5XbqeV2Dif17ARwH8B6Ab9V6oaFEjD8B0AdgAtNPVw8CWI3p1eMTwcfmWsc5K94vYvpH9sMADgV/7s14zJ8H8Jsg5iMAvh1cz2zMZb4e5nV1YvYqt9POa+7EJCLyFHdiEhF5igM4EZGnOIATEXmKAzgRkac4gBMReYoDOBGRpziAExF5igM4EZGn/h8vWfef0vC+JgAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 432x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXAAAAC4CAYAAAD61bdSAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAPyklEQVR4nO3dfYxc5XXH8d/ZZW3jF1SM18YBN2uDjaCoXcjKJaGqiJCDi6KaqCoKlSr/gepGAokgVNVK/mjS/kNUOciV2lSOsOxWKQkRQaAIxbGsVlabBlgTY6A2fsMUY2MvsRG2CfviPf1jr4vxPo/X83bvHM/3I6125sydeZ67c3x89+6Z55q7CwAQT1fVEwAA1IcCDgBBUcABICgKOAAERQEHgKAo4AAQVEMF3MxWmtmbZrbfzNY2a1JA1chtRGD19oGbWbekvZJWSDos6WVJD7j7/+SeM2/ePO/r65sUf+34seT20985U9fcUJ9lv/tRMr5318yats/JvU6zfKwzGvFha/R16sntaTbdZ2hWo0M31fBvp3/eXZkfUddo+nX8iswAmdJxxVDr/93aTT3J+NjZ9DHpzTNPJuMHhuck4zdMP1XTfA6P5nP7g+Erk/Ere9I/8I8+njYpNvbrkzp76sykNy731lyK5ZL2u/tBSTKzH0paJSmb5H19fRocHJwUX7x+XXL7Gx/9ZQPTQ622bNmZjN/zmf6ats/JvU6zvOjbmvVSNef2DM3S79vdzRq/KfZ+c3kyPmdv+p/9rPfGk/HfzEsXRRtLjzv/n34x9eQa1LNhYTJ+7HS6IL90+9PJ+P0H0+/Z00tqy6W/eu+27GM/PXBrMv471x5NxnfsWTwp9t7f/UNy20ZOoVwn6Z3z7h8uYkB05DZCaKSAp34Pm/RLlZmtMbNBMxscGhpqYDigNDXn9qiGS5gW8GmNFPDDkhadd/96SUcu3MjdN7j7gLsP9Pb2NjAcUJqac7tH00ubHHBOI+fAX5a01MwWS3pX0lcl/Vk9L/TWI48l44vFufEytfocdSBNy+0qLfvaSzVt/94jX0jGTy9OnxvvGkn/MXR+TaPWZ/Su9PnjBf+R3j6X2/s2fzb9hCW1zeeZ/0r/vUGSpp3oTsZfPTg7GZ89NPnn2vVx+mdddwF39zEze1jSFkndkja6+xv1vh7QLshtRNHIEbjc/QVJLzRpLkDbILcRAZ/EBICgKOAAEBQFHACCaugceKtdzt0p+5+4IxmPtA/ZT2ge2VnqPNAc165v/ScoWy3XnZKzdPUryfg96k/Gc7nd80H+WLgn86n8aR9e+pIGllm2gCNwAAiKAg4AQVHAASAoCjgABEUBB4Cg2roLJafW7pSLqarro8puk9xf0pu1FgprqqAqteb2299Or/8yNju9/ssN29LrfvfuyV8Yp3sks5ZMZj11S1xkp2sk/focgQNAUBRwAAiKAg4AQVHAASAoCjgABBWyCyUn150iSSu6/rTEmbQ3ukQQ3b7Ntyfj9x+8Jhl/+9s3JeOz3k13d4xclT62HR6dkYxPO302GZekrtH0GJZuTlHX6OQHLPPyHIEDQFAUcAAIigIOAEFRwAEgKAo4AARFAQeAoBpqIzSzQ5JOSToraczdB5oxqVbYOv7jZHzx+toWwIp0ybNaL21Ge+EnIuV2Jzq4YmNN29/44tJkPNcu2D2Sfp3p72cugzaWX8wq91iqXVCSxrvTY6Q0ow/8i+7+fhNeB2g35DbaGqdQACCoRgu4S/q5me0wszWpDcxsjZkNmtng0NBQg8MBpakpt0c1XPL0gMZPodzp7kfMbL6krWa2x923n7+Bu2+QtEGSBgYG8ieKgPZSU25fZXPJbZSuoSNwdz9SfD8u6VlJy5sxKaBq5DYiqPsI3MxmSepy91PF7S9J+tumzawkuQWw2nHxq1q7SlCfenJ72eeWaOvg5E6ndsyjqvT/Kv/YdxbsbOnY473ptpLh0enJeK7bJLcA1XjPRTpHMr+b2dn0c8anJ46rM4fajZxCWSDpWTM79zr/5u4/a+D1gHZBbiOEugu4ux+U9HtNnAvQFshtREEbIQAERQEHgKAo4AAQ1GV1SbVmatbaKTn1rKnCWiWI7KdPfyH72O6V1ybjb25fnIyP/la6HeRP7nwpGZ+/ZVoynrsUWm79kly3ycx3f5OMTzwpPVcbS8e9a/JxtWXWTeEIHACCooADQFAUcAAIigIOAEFRwAEgKLpQahRp7RRUL9fNdDnny1uPfz4Zn/NWfsHGPUcWJOMzPsisF9KTPvY8cHpeMt7zUXrs7uFcPN2d4l2ZNVJGxpLxiSelx8h1oahr8vaW+dFxBA4AQVHAASAoCjgABEUBB4CgKOAAEBRdKE3Sid0GQMrYrHR3xcic7uxzrujJrEkymt5+RuaKOb/a05eML8p0gnRl1hgZ767hajlKr19yjp3NdbQ0fvzMETgABEUBB4CgKOAAEBQFHACCooADQFBTdqGY2UZJX5Z03N1vLWJzJf1IUp+kQ5Lud/eTrZtmXHSntC9yuzWuOJM+Lpx2Kr8Wyskjs5Lx7vSFdDQ6Jx2fec1HyfjZntnJeFemqyR3RR7lduEih8KudPeNKd2dUotLOQLfJGnlBbG1kra5+1JJ24r7QDSbRG4jsCkLuLtvl3TigvAqSZuL25sl3dfcaQGtR24junrPgS9w96OSVHyf37wpAZUitxFGy/+IaWZrzGzQzAaHhoZaPRxQGnIbVau3gB8zs4WSVHw/ntvQ3Te4+4C7D/T29tY5HFAachth1LsWyvOSVkt6vPj+XNNm1CFy3SmL169r2hg3PvrLpr1WB6krt/fuOBi+syiXk7Wq5+eQvo5OHPn+mvwVinLGZk9en+Xj76Q7WaY8AjezpyT9t6SbzOywmT2oieReYWb7JK0o7gOhkNuIbsojcHd/IPPQ3U2eC1AqchvR8UlMAAiKAg4AQVHAASAorsjTZt565LHsY1G6HLYc2ZmM3/OZ/lLn0ema1VWCT+Ry+4/3XbgiwyfGXk1f9ad73nAyfuX0yZch6spdsSg7KgCgrVHAASAoCjgABEUBB4CgKOAAEBQFHACCoo0wkCiXZ6NdEJervz7Wn4wf+NmS7HOuPpFb6urKZHRkzszJwdN1LmYFAGhPFHAACIoCDgBBUcABICgKOAAERRfKZaDWy7PlLrW2/4k7atoe6DQ7b0vHr9cvWjruO34mGecIHACCooADQFAUcAAIigIOAEFRwAEgqCm7UMxso6QvSzru7rcWsW9J+gtJQ8Vm33D3F1o1SdQnd3m2xaqtO+Vy1czcXva5Jdo6OLkbqFnr1HB5tLgO/P3nk/FZhy0ZP903+RJsw+vS/zYv5Qh8k6TUBd+ecPf+4ovijYg2idxGYFMWcHffLulECXMBSkVuI7pGzoE/bGa7zGyjmV2d28jM1pjZoJkNDg0N5TYD2gm5jRDqLeDfk3SDpH5JR6XMSVVJ7r7B3QfcfaC3t7fO4YDSkNsIo64C7u7H3P2su49L+r6k5c2dFlANchuR1LUWipktdPejxd2vSHq9eVNCq+W6U1Y82l5X9qlCs3O71qso0W3S3vb+c/r/8zl786V0zqF0fMbJyd0mkmTjk4+ru4fTr3EpbYRPSbpL0jwzOyzpbyTdZWb9klzSIUl/OdXrAO2G3EZ0UxZwd38gEX6yBXMBSkVuIzo+iQkAQVHAASAoCjgABMUVefD/ar2yT06nralyMbWuhUJ3Sntb9rWXWj7GVYnYIa7IAwCXFwo4AARFAQeAoCjgABAUBRwAgqILBVPKrp3SpKvNXM5YCwWtxBE4AARFAQeAoCjgABAUBRwAgqKAA0BQdKGgbs1aO0Vi/RSgHhyBA0BQFHAACIoCDgBBUcABICgKOAAENWUXipktkvQvkq6VNC5pg7uvN7O5kn4kqU/SIUn3u/vJ1k0VUURZO6XK3O7ENU/q2edac6bWtWeiu5Qj8DFJj7n7zZLukPSQmd0iaa2kbe6+VNK24j4QCbmN0KYs4O5+1N1fKW6fkrRb0nWSVknaXGy2WdJ9LZoj0BLkNqKr6Ry4mfVJuk3Si5IWuPtRaeIfgqT5meesMbNBMxscGhpqcLpAa5DbiOiSC7iZzZb0jKSvu/uHl/o8d9/g7gPuPtDb21vPHIGWIrcR1SUVcDPr0USC/8Ddf1KEj5nZwuLxhZKOt2aKQOuQ24hsygJuZibpSUm73f275z30vKTVxe3Vkp5r/vSA1iG3Ed2lLGZ1p6Q/l/Same0sYt+Q9Likp83sQUn/K+ny7NNB01ysjayeBbAuNLyu5gWxyG2ENmUBd/f/lGSZh+9u7nSA8pDbiI5PYgJAUBRwAAiKAg4AQVHAASAoLqmGttCMBbB+7WeaNR00oIyFujpxMbAUjsABICgKOAAERQEHgKAo4AAQFAUcAIKiCwVtrdMukQXUgiNwAAiKAg4AQVHAASAoCjgABEUBB4Cg6EJBSKnuFDPbUcFUgMpwBA4AQVHAASAoCjgABEUBB4CgKOAAEJS5e3mDmQ1Jeru4O0/S+6UN/omqxq1y7E7Z58+6e29JY31Kh+d2p+RXleMmc7vUAv6pgc0G3X2gU8atcuxO3Ocqddr73In51S55zSkUAAiKAg4AQVVZwDd02LhVjt2J+1ylTnufOzG/2iKvKzsHDgBoDKdQACCo0gu4ma00szfNbL+ZrS157ENm9pqZ7TSzwRaPtdHMjpvZ6+fF5prZVjPbV3y/uqRxv2Vm7xb7vdPM7m3BuIvM7N/NbLeZvWFmjxTxlu9zu+iE3K4qry8ydkfndqkF3My6Jf2jpD+SdIukB8zsljLnIOmL7t5fQgvQJkkrL4itlbTN3ZdK2lbcL2NcSXqi2O9+d3+hBeOOSXrM3W+WdIekh4r3tox9rlwH5fYmVZPXubGlDs7tso/Al0va7+4H3X1E0g8lrSp5DqVw9+2STlwQXiVpc3F7s6T7Shq35dz9qLu/Utw+JWm3pOtUwj63iY7I7ary+iJjt1w753bZBfw6Se+cd/9wESuLS/q5me0wszUljnvOAnc/Kk0khaT5JY79sJntKn4NbemvembWJ+k2SS+q2n0uUyfndtXvccfmdtkF3BKxMttg7nT32zXxa+5DZvaHJY5dpe9JukFSv6Sjkta1aiAzmy3pGUlfd/cPWzVOGyK3q9HRuV12AT8sadF596+XdKSswd39SPH9uKRnNfFrb5mOmdlCSSq+Hy9jUHc/5u5n3X1c0vfVov02sx5NJPgP3P0nRbiSfa5AJ+d2Ze9xp+d22QX8ZUlLzWyxmU2T9FVJz5cxsJnNMrM5525L+pKk1y/+rKZ7XtLq4vZqSc+VMei5JCt8RS3YbzMzSU9K2u3u3z3voUr2uQKdnNuVvccdn9vuXuqXpHsl7ZV0QNI3Sxx3iaRXi683Wj22pKc08SvdqCaOzh6UdI0m/lq9r/g+t6Rx/1XSa5J2aSLpFrZg3D/QxCmDXZJ2Fl/3lrHP7fLVCbldVV5fZOyOzm0+iQkAQfFJTAAIigIOAEFRwAEgKAo4AARFAQeAoCjgABAUBRwAgqKAA0BQ/wf3A6ub/owxNAAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 432x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXAAAAC4CAYAAAD61bdSAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAPHklEQVR4nO3dXYxc9XnH8d+zL7aJTSsbL9QxJrtxbAnaKk66ARqqiIgmotyYXLSKLypXQnKiggqVU8VqpCTqFY1KqKO2CY5AmColLwoIX6A2rlUJVSUuC3JsEye2AxT8ot0lJvH7vj692GOxMed/dnfmzDnzzH4/0mpn/mdmzrPjx789O/Of/zF3FwAgnq66CwAANIYAB4CgCHAACIoAB4CgCHAACIoAB4CgmgpwM7vbzH5uZsfNbEdZRQF1o7cRgTU6D9zMuiUdlfQpSSckvSRpi7v/NHWf1atXe39/f+62QyPDueNL37rQUH1YfC7rgsZ9zJp9nEZ6e4kt9WVa3uyuazF2Y37dXZMFd5pOb+qayh+3xLgkTS3NH++5nM4nt/Q/9XRP6vEKCi9gUw3k5HRB7T2JY+dEHl8e+5XGJy++5wdO/Jjzcquk4+7+miSZ2XclbZaUbPL+/n4NDQ3lbhvY+Uju+If++sdNlIjFZL/vK+uhFtzby7Rct9ldZe2/Ur946A9zx5e9nQ7I7svpx1v66/wQWvrrdHj+6kPdueOrjqR/i0z3puu7tDo/IFf+LF24FQRu94Xx/A0FB8B2KXEfSZPXrcgd75rI/y3341cfy799cg9zWyvprVnXT2RjQHT0NkJoJsDzfv2959eRmW0zsyEzGxodHW1id0BlFtzbExqroCzgNzUT4CckrZt1/UZJp66+kbvvcvdBdx/s6+trYndAZRbc271KvIgLtFAzAf6SpA1mNmBmSyR9VtKecsoCakVvI4SG38R090kze0DSf0jqlvSEu7/a6OO9/uD23PEB5b+5KfEGJ1qj7N5ud+v/5sXc8WO7P5q8j19KR8eyU/nbpobTx4vnb85/w++a0d7kfVIzTSTpwtr8NzhXnEzfqWuyYKZJ4g1OK3gTs6tg2+S1+T9X91jiOerK/3mamYUid39e0vPNPAbQjuhtRMAnMQEgKAIcAIIiwAEgKAIcAIJq6k3MKqRmp0jFM1RSmLkCzM+Gra80dL+3vvTx3HEvOFzsOpsfRd3jBR9vL/js1JJ3ErM2LqUXZLGJ9Ef9u8YTH+kvWI/FJgseL7WvBS7VwhE4AARFgANAUAQ4AARFgANAUAQ4AARFgANAUG0/jbBI0RTDT3X9aYWVAJ3n6LduTW77rSPp6Pjt1/PnwvVeLJhWN5l/Rp73DafPalOkZyy/vp6z6bmHRdP+LDWNsICNTSS3pepInbotNc4ROAAERYADQFAEOAAERYADQFAEOAAERYADQFChpxEW2Tv9g9zxgZ0LX8FQYhVDLD4bP/+/pT7e0V0fS2774w8fzB1/8ZkPJ+/TfTm9r4vvz5929/6J5cn7dI2npxH2XMxfxdC706sR9pxPT4E8359fR+q8nFOv5x9rcwQOAEER4AAQFAEOAEER4AAQFAEOAEE1NQvFzN6QdE7SlKRJdx8so6hWYgEszEfE3m4XR/8lfxGsnnfyF6ySpP88dHPu+HW/TJ8Ts+dyeptN5x+b9lxInxOzeyy9rWs8f9t0T/oY2CbSj9eTWNjLEhNhUuNlTCP8pLu/XcLjAO2G3kZb4yUUAAiq2QB3ST8ys5fNbFsZBQFtgt5G22v2JZQ73P2UmV0vaa+Z/czdX5h9g6z5t0nSTTfd1OTugMosqLeX6X111IhFrqkjcHc/lX0fkfSspPe8e+Huu9x90N0H+/r6mtkdUJmF9navllZdItB4gJvZcjO79splSZ+WdLiswoC60NuIopmXUG6Q9KyZXXmcf3P3fy+lqpqkFsCS0otgschVR+q43q7Sxr8sdxGslNefTi909Re/m///8geP3ZW8z5Jz6WmJvRfy5/FN96QXs1r2y3S8vv37vbnjPRfzbz/1cv5+Gg5wd39NUvoZBIKitxEF0wgBICgCHACCIsABICgCHACCIsABIKiOPSdm2VKrGA6Ic2xC2vgHH9TeofxpqKxy2RoDW36S3Lb6yLnc8YkV6cfruZTeNr4i/1h38pr0fbon0vG69u//J3f8+D/enjs+lficGEfgABAUAQ4AQRHgABAUAQ4AQRHgABAUs1CaxDk2MZfUImlF/VG0sBp9NePot/LPvSlJO396IXf8mjPpBauWnC84x+ZU/rbuifRiVt2XEieylPTmlz+eO75sJP/2XROJ8eQeAABtjQAHgKAIcAAIigAHgKAIcAAIigAHgKCYRthCnGMTaJ2Nny/33JvHvnFbcltXYrrg+u3p/6+nt+dPFZSkm/4ufzGrlJOePy2SI3AACIoAB4CgCHAACIoAB4CgCHAACGrOADezJ8xsxMwOzxpbZWZ7zexY9n1la8sEykdvIzpzT6/AJUlm9glJ5yU95e6/l419TdIZd3/YzHZIWunuX5xrZ4ODgz40NFRC2Z0rNb2wUYtpWuJ+36ezfia9PNxVovZ2ajVCVjDsXKnenvMI3N1fkHTmquHNknZnl3dLurfZAoGq0duIrtHXwG9w99OSlH2/vrySgFrR2wij5W9imtk2Mxsys6HR0dFW7w6oDL2NujUa4MNmtkaSsu+J80hI7r7L3QfdfbCvr6/B3QGVobcRRqMBvkfS1uzyVknPlVMOUDt6G2HMuZiVmT0t6U5Jq83shKSvSHpY0vfN7D5Jb0riLe6ScI7N6kTt7aLZJmjcyS+mF5+6uG4qd3zDA/uT9zn62MeS2zZ+7qX5F1ZgzgB39y2JTXeVUgFQE3ob0fFJTAAIigAHgKAIcAAIigAHgKAIcAAIinNiBpKaPsb0QqB5l/umk9u8q3jRvzxLh1sfrxyBA0BQBDgABEWAA0BQBDgABEWAA0BQzELpAEWLGxWdoq3dT7d2/NHbc8fbvW7EtP4L5fbVB778YqmPl4cjcAAIigAHgKAIcAAIigAHgKAIcAAIigAHgKCYRtjhis6xOaD0FMOUKqfwMV2wPEVTTVOLoTVyH1SLI3AACIoAB4CgCHAACIoAB4CgCHAACGrOADezJ8xsxMwOzxr7qpmdNLMD2dc9rS0TKB+9jejmM43wSUn/JOmpq8Yfdfd/KL0iVCY1xXARTRF7UvR24XRBNO7YzvzVNCVpw4PlTJGd8wjc3V+QdKaUvQFthN5GdM28Bv6AmR3M/gxdWVpFQP3obYTQaIB/U9J6SZsknZbSH+kzs21mNmRmQ6Ojow3uDqgMvY0wGgpwdx929yl3n5b0bUm3Ftx2l7sPuvtgX19fo3UClaC3EUlDAW5ma2Zd/Yykw6nbApHQ24hkzlkoZva0pDslrTazE5K+IulOM9skySW9IelzrSsRVWv0HJsp7booFb2NViprpkmROQPc3bfkDD/eglqAStHbiI5PYgJAUAQ4AARFgANAUAQ4AARFgANAUJwTEwtSdI7NRbQI1qJX9jk2F/pYnerYN27LHR/7Wv6URI7AASAoAhwAgiLAASAoAhwAgiLAASAoAhwAgmIaIUqTmiZWtIJhu65UCNRhw1/tzx0/4xdyxzkCB4CgCHAACIoAB4CgCHAACIoAB4CgmIWClitaAGtAnXOOzcWkkUWmFtvCVFXgCBwAgiLAASAoAhwAgiLAASAoAhwAgiLAASCoOacRmtk6SU9J+h1J05J2uftOM1sl6XuS+iW9IenP3P2d1pWKTlTnOTbp7ca1+zkxU/vqtKmM8zkCn5S03d1vlnS7pPvN7BZJOyTtc/cNkvZl14FI6G2ENmeAu/tpd38lu3xO0hFJayVtlrQ7u9luSfe2qEagJehtRLeg18DNrF/SRyTtl3SDu5+WZv4jSLo+cZ9tZjZkZkOjo6NNlgu0Br2NiOYd4Ga2QtIPJT3k7mfnez933+Xug+4+2NfX10iNQEvR24hqXgFuZr2aafDvuPsz2fCwma3Jtq+RNNKaEoHWobcR2ZwBbmYm6XFJR9z967M27ZG0Nbu8VdJz5ZcHtA69jejmsxrhHZL+XNIhMzuQjf2tpIclfd/M7pP0pqTOmp+D2i30HJtjjyx4lUJ6W41N+2v31Qg7bbpgypwB7u7/LckSm+8qtxygOvQ2ouOTmAAQFAEOAEER4AAQFAEOAEFxTkyEk1oAyx76wssVl9IRGllkqhOVPeumChyBA0BQBDgABEWAA0BQBDgABEWAA0BQBDgABGXuXt3OzEYl/V92dbWktyvbeT5qeFc71NFsDR9w91oW5qa3qaHFNeT2dqUB/hs7Nhty98Fadk4NbVlHO9RQhnb4OahhcdTASygAEBQBDgBB1Rngu2rc9xXU8K52qKMdaihDO/wc1DCjo2uo7TVwAEBzeAkFAIKqJcDN7G4z+7mZHTezHTXV8IaZHTKzA2Y2VNE+nzCzETM7PGtslZntNbNj2feVNdTwVTM7mT0XB8zsnhbXsM7M/svMjpjZq2b2YDZe6XNRtnbo66wOevvdsY7u7coD3My6Jf2zpD+RdIukLWZ2S9V1ZD7p7psqnGb0pKS7rxrbIWmfu2+QtC+7XnUNkvRo9lxscvfnW1zDpKTt7n6zpNsl3Z/1QNXPRWnarK8lenu2ju3tOo7Ab5V03N1fc/dxSd+VtLmGOirn7i9IOnPV8GZJu7PLuyXdW0MNlXL30+7+Snb5nKQjktaq4ueiZIu2ryV6e1YNlfZ2HQG+VtJbs66fyMaq5pJ+ZGYvm9m2GvZ/xQ3uflqa+ceXdH1NdTxgZgezP0Mre+nCzPolfUTSfrXPc9GIdulrid6+Wsf2dh0BbjljdUyFucPdP6qZP3nvN7NP1FBDu/impPWSNkk6LemRKnZqZisk/VDSQ+5+top9tlC79LVEb8/W0b1dR4CfkLRu1vUbJZ2qugh3P5V9H5H0rGb+BK7DsJmtkaTs+0jVBbj7sLtPufu0pG+rgufCzHo10+DfcfdnsuHan4smtEVfS/T2bJ3e23UE+EuSNpjZgJktkfRZSXuqLMDMlpvZtVcuS/q0pMPF92qZPZK2Zpe3Snqu6gKuNFbmM2rxc2FmJulxSUfc/euzNtX+XDSh9r6W6O2rdXxvu3vlX5LukXRU0i8kfamG/X9Q0k+yr1erqkHS05r5M25CM0ds90m6TjPvSh/Lvq+qoYZ/lXRI0sGs0da0uIY/0szLCwclHci+7qn6uWjBz1VrX2c10NuLqLf5JCYABMUnMQEgKAIcAIIiwAEgKAIcAIIiwAEgKAIcAIIiwAEgKAIcAIL6f9Wtat8DWiv4AAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 432x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXAAAAC5CAYAAAAxiWT3AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAUGElEQVR4nO3dW2xc13UG4H/NcIakKCkSJUqmLTVUaim1ESeyy9iyG6BBHMNKXpQCbWE/tHowIrhJEbtxCyu9GDBQtG4LO2iaAoFSu5YBI4Fbp7VaBDUENk6R1pZFO4pvskj5LksRKcm68D6X1QeOSK7F4Vw4M2fOJv8PEMh1zsw5e6jNhc01e/YWVQUREYUn0ewGEBHR4jCBExEFigmciChQTOBERIFiAiciChQTOBFRoGpK4CKyU0SOichxEdlbr0YRNRv7NoVAFjsPXESSAAYA3AbgBIDDAO5U1Tfq1zyi6LFvUyhaanjujQCOq+rbACAiPwSwC8CCnXz9+vXa09MzE786dNqcb/1gtIbm0HI3gVFM6aTU4VJV9+20tGobOupw68pkrrD3krx7gIs1aeOWCTtwk5yN8y32j/OEO59LuR+zCxNZ9/i0fYAW+dvftzE16troX5O7pybtAcm752fsBcSPXf1gVtwN8q4BCfci3P2QcK95fAKLtVDfriWBXwXggznxCQA3lXpCT08P+vv7Z+Itf/+wOX/1H71QQ3NouTukffW6VNV9uw0duElurdf9yzpx1y0mTl2y51vGbDKZ+pj93V87kDVx+lLGxBPr0iZuPWfPj2yy5/Mt9vrtZ3ImvvgrNtXk2jHP5Brb5isO2WukRm2bs20242dX2ISanLTXa//lmIkl6xJ6xt5PXQKXiUl7vq3Vnp+yPyNdYc/njyz+D7iF+nYtNfBiI5159RgR2SMi/SLSPzw8XMPtiCJTdd/OYLLIU4gaq5YR+AkAm+fEmwCc9A9S1X0A9gFAb2+v+SV45577zGO3gCNyKu34t3eYuEF9pOq+vVo6I11UaNNf/Z+JB753o4lTH9nRaWbDlInTF1MmzrsSx0i3q2c4I5vs2C+7wpdg7PMvXm1Hu/mVdrQLAJ3dF0w8fnydfY4r2+RabZxZYWM/Ak9fsK854Ubc4ksm80oy9jVoq32N4kow+XTpn2E91DICPwxgq4hsEZE0gDsAHKhPs4iain2bgrDoEbiqZkXkDwE8CyAJ4DFVfb1uLSNqEvZtCkUtJRSo6o8B/LhObSGKDfZtCkFNCbzeytXEPdbIlx/+nxe37e4XS54f3H+DifPuN3/eND9Xvs27WOyEEHz8gedN/OFeO0tGO20N/rotH85r49nxFSaeaLPns5nyUxHN49v9a3Jx1tW8U/aCmnI17gn3ov00QkfdVMx6zG/1+FF6IqJAMYETEQWKCZyIKFCxqoF7viZ+W+J3mtQSonjzNe5VP7cF5I7X7OM7huwc6JZRNyc6Z+u/beds/Vfdx8RPfdPWvNtPuznRSfupxFcnN8NLnbXpqOucnXfdMm6vqS575V2N29f1k66GLZPuNft53K59knNz1zNu/Ju15xPuo/v+gwLHH3Gfafhm9e/vcARORBQoJnAiokAxgRMRBSrWNXDvYP5fTOxXM/RCnzP87Mkj847dfuX2yNtB8bd198s1Pf+DP7c17M1/adda8TXuS79mV97btqf071qni4v17VPZERP/pvyJidMXXE173F3ATbTO2bI7Wi/aA8kJtxqhXzK31Y5vW10RO+fWQvHJNNth117xK6MspubtcQRORBQoJnAiokAxgRMRBSqoGrjHeeJElUk9123igRd67Hm7FDfe+rubTbzqHXu+7aSt73pr/9dWvT+58vQCj5x1z/u7TJx0O4j5LdSSU7YonbBl+Xm7BPmJ3b7m7Wvo89ZO8bvIldmSzc8rr9bceeKTDxevl3METkQUKCZwIqJAMYETEQVKtMY6TTV6e3t17q70jcZd78NTy56Xh7QPF/VcI5ZdLmu1dGqUu9IvR4PfucnErefszOp8i6uJT9mu0PmmLYInp9xaK2Nu3063B2f6vC2y59N2/NsyYs9nVqXt+f9+CYu1UN/mCJyIKFBM4EREgWICJyIKVNDzwMuJ2x6btdR3l4tQfybbfv0TONg/u1YPP5NQf1u/cajk+fcedPtwupp4xu2RmU+WHr/mXA08MelWM3FroufdHpgN2QTT4QiciChQTOBERIFiAiciCtSSroF7zV47JdT6LlXPr13v+1q58zTfL//9GhPnXlhr4rYz9vHZDluETo27eeCTNk5k3Xrgvgbu107J+rVY7J6Y+ZxfAbw6H+6dreln/plroRARLSlM4EREgWICJyIK1LKqgXvLbY9NopCNDq4x8Zozbv1tW4JG2zl7PjXqHuBK2qnRrImT43Z8m5iwz5ec21Nzyj6/xW7x6W9X1uTa2WfkFyincwRORBQoJnAiokCVTeAi8piIDInIa3OOdYrIQREZLHxdW+oaRHHEvk2hq6QG/jiA7wJ4Ys6xvQD6VPUhEdlbiO+vf/Oi1ex54jTfsyePmPj2K7fX8/KPI6K+7d9vqfbxS60vDnz/s/OOXXP1hyZ+t6/HxB0n7eNTo36TSxu2TNiqc9LNA/cS47aGLUlfA7fnPcnO23TThL4G7vv2oxeuMPF3Bz6a+T7Z7ur3l9tUskUAVPV/AJxzh3cB2F/4fj+Ar5S7DlHcsG9T6BZbA9+oqqcAoPB1Q/2aRNRU7NsUjIa/iSkie0SkX0T6h4eHG307osiwb1OzLXYe+GkR6VbVUyLSDWBooQeq6j4A+4DpPTEXeb+m4DzxZWlZ9O1m2/bVw/OO+SrvZtii9+ATN5hYDreZOJGx/wX5pF+vO+XO2/u1pUov4J1ss0+QjKt5u/upXx+8jL99+rdse87OXk8vFZ8IvtgR+AEAuwvf7wbwzCKvQxQ37NsUjEqmEf4AwPMAPikiJ0TkLgAPAbhNRAYB3FaIiYLCvk2hK1tCUdU7Fzh1a53bQhQp9m0K3bJeC6VanCcevTrP+46taueJh27wOzfNO6ar3DzrjCsQuPW3W8Zc7Od9Z+zTfY1c/LRt9y6Guj0vVdz64Hn3BLdeuLgLHnNz3z/3yidMvOo9e7n0xdkGJqdQFD9KT0QUKCZwIqJAMYETEQWKNfAaVDtP3OO88fIavBZKbJTbM3Op2fqNQ3W/5ltPXm9iOWHnibeM2fFqPm1r1KvfcuNZV+L2NfZE1qbP9EW3J2bKXm/bV180se/bv/rG3SZuG559fq4VRXEETkQUKCZwIqJAMYETEQWKNfA6isM88aVWMw69/ZVa6jXvevB9+/rDd5g4f8HO025x87yn1tgD+TV2ovjUkC00J9w8cl+HTrs9L3Ntdjzs55EPPNpr4jve6TTxxwbs41OjszV335aZ48UPExFR3DGBExEFigmciChQrIE3UDP2NQy9ZuzrnF7or48W73vnrzJxTm3N+MoN5008dHKjidMf2fFqbiJt4vaztkbutrREcsrOA1c3/E1OuvXI7fLjeOdL/4RSrrvd7on50ZmOme+zPy2+3DxH4EREgWICJyIKFBM4EVGgWAOPEPfYLG+p1rjLrXXCteXL+7dru0zcjaMlH78Fb5c8//ZDN5t49Aq/Vop9fPvp0uuJ+7VSJlfb65Xr21fiDRN/8Be3zN5rqvh+nRyBExEFigmciChQTOBERIFiDbyJ4rB2CkWj2rVOWCOv3uATN5h4/bpLJj57bJ2JW8bt83N2+XBkVtqaduqSrUOnLxWfm32Z32PTO/Mf20w89dP1Jl717uwFuCcmEdESwwRORBQoJnAiokCxBh4jte6xCSzPueNEALD1918ueX4tBqu63ntPXWfiqZFVJt74D8+beOhrt5h4dLPbc9Nd/18//ZiJd459zd7v+OxaKLm+4m3kCJyIKFBM4EREgWICJyIKFGvgMebniQOcD7xUNXpPzHLzypfjvPOB73/WHnBrm6xptfPIs5P2/Dt/bddSWf2WWy88aR//B4PHTXzPu79t4lzWPiE9PmfeuWvbZRyBExEFigmciChQZRO4iGwWkZ+IyFEReV1E7ikc7xSRgyIyWPi6tvHNJaof9m0KXSUj8CyA+1T1GgA7AHxdRK4FsBdAn6puBdBXiIlCwr5NQSv7JqaqngJwqvD9JRE5CuAqALsAfL7wsP0AngNwf0NaSTOW+ptNUW5qzL69vK3ZYN+kHHvV/qE1etbGK0fsm5TZDr/Jgj3fMmLPf6VjxMZb/8vEfZvsm5gPrNs18/2JH2ZQTFU1cBHpAXA9gEMANhZ+AS7/Imyo5lpEccK+TSGqOIGLyEoATwO4V1UvVvG8PSLSLyL9w8PDi2kjUUOxb1OoKkrgIpLCdAd/UlV/VDh8WkS6C+e7AQwVe66q7lPVXlXt7erqKvYQoqZh36aQla2Bi4gAeBTAUVV9ZM6pAwB2A3io8PWZhrSQSlpqGyVHuakx+/bytmHXmw29/joXb7lijz3Q4ha7ej1l4tbzs+f1nD03c4kK2vEbAH4PwKsicqRw7E8x3bmfEpG7ALwPYGm9m0bLAfs2Ba2SWSg/A1B8T3vg1vo2hyg67NsUOn4Sk4goUFzMaomJeqNkP287yhr2clLtYlTVXq/Wxy+1zyMA8/v2hbzdBfl3N9nFrAa+d6OJuzZ/ZOIVP3Pp1v3t137GrljVenE2TmSL75DMETgRUaCYwImIAsUETkQUKNbAl7haN0ouN2+cNW9aqqrt29vufrHk+bH77Ye9xJW1c2lbFM+2z46vNVF8shRH4EREgWICJyIKFBM4EVGgWANfZqKeJ06NEfUmyLU+n/0MyKxyRW9X1k5k7IH8nOVP8m6D5Jnn1KFdRETUBEzgRESBYgInIgoUa+DLHGuVRNFoO2Nr3MlJt4fmmI3TI3PWQskVvyZH4EREgWICJyIKFBM4EVGgWAMno957bB7/9o6qHk+0VK1+zxay1Q2f0xeyJk5OzqmBZ+xa4TPH69M0IiKKGhM4EVGgmMCJiALFGjiVVOvaKax5Lw+N2JNzqX0mwe9r6df/TuTcWilafB9M85yaW0VERE3BBE5EFCgmcCKiQLEGTlVp9B6bREtV+mKm5PnkmJ0HLpnZeePi6+MFHIETEQWKCZyIKFBM4EREgWINnGrCPTapEvXYwzP0tes1Yed9S97WtdXtkenCojgCJyIKVNkELiJtIvKiiPxCRF4XkQcLxztF5KCIDBa+rm18c4nqh32bQlfJCHwSwBdU9TMAtgPYKSI7AOwF0KeqWwH0FWKikLBvU9DK1sBVVQGMFMJU4Z8C2AXg84Xj+wE8B+D+ureQghJSnZJ9m6LUMmLngfuad2LMnpfcnPXDF1gXpaIauIgkReQIgCEAB1X1EICNqnpq+tp6CsCGSq5FFCfs2xSyihK4quZUdTuATQBuFJFPVXoDEdkjIv0i0j88PLzIZhI1Bvs2hayqWSiqeh7Tf07uBHBaRLoBoPB1aIHn7FPVXlXt7erqqq21RA3Cvk0hKlsDF5EuABlVPS8i7QC+COBvABwAsBvAQ4WvzzSyoRSmeu+xWU/s29Hx74UsZl54nN9PqUSurbqP3UgmOfO9n0N+WSVX7AawX0SSmB6xP6Wq/ykizwN4SkTuAvA+gLB/urQcsW9T0CqZhfIKgOuLHD8L4NZGNIooCuzbFDp+EpOIKFBcC4UixbVTlieuhQIkx0uvBy5Tbj3wOWuA+3VTLuMInIgoUEzgRESBYgInIgoUa+DUVKHXNYkqletIuQO2ri2ppIkTc/bEXGgeOEfgRESBYgInIgoUEzgRUaBYA6dYifPaKaUMvPR20PX7cu9FlJvHXe1rr2ReeLnH1GNueZSq/RmZCrlOFH0MR+BERIFiAiciChQTOBFRoFgDp1hbqmunRD3/vdp6ca315dDq06HiCJyIKFBM4EREgWICJyIKFGvgFJRS88QnH47HnPBKLJVaPjUXR+BERIFiAiciChQTOBFRoFgDp6DNnScu9/7xS01sSl1VO0+82fOum33/5YojcCKiQDGBExEFigmciChQoqrlH1Wvm4kMA3gPwHoAZyK7cfXYvto0q30fV9WuJtyXfbt+2L7iivbtSBP4zE1F+lW1N/IbV4jtq03c29dIcX/tbF9t4tY+llCIiALFBE5EFKhmJfB9Tbpvpdi+2sS9fY0U99fO9tUmVu1rSg2ciIhqxxIKEVGgIk3gIrJTRI6JyHER2RvlvRciIo+JyJCIvDbnWKeIHBSRwcLXtU1q22YR+YmIHBWR10Xknpi1r01EXhSRXxTa92Cc2heluPXtOPfrQlvYt+sgsgQuIkkA/wjgSwCuBXCniFwb1f1LeBzATndsL4A+Vd0KoK8QN0MWwH2qeg2AHQC+XviZxaV9kwC+oKqfAbAdwE4R2RGj9kUipn37ccS3XwPs2/WhqpH8A3AzgGfnxN8C8K2o7l+mbT0AXpsTHwPQXfi+G8CxZrex0JZnANwWx/YBWAHgZQA3xbF9DX7tsezbofTrQnvYtxfxL8oSylUAPpgTnygci6ONqnoKAApfNzS5PRCRHgDXAziEGLVPRJIicgTAEICDqhqr9kUklL4dy/8X9u3FizKBS5FjnAJTARFZCeBpAPeq6sVmt2cuVc2p6nYAmwDcKCKfanKTmoF9e5HYt2sTZQI/AWDznHgTgJMR3r8ap0WkGwAKX4ea1RARSWG6gz+pqj+KW/suU9XzAJ7DdN01du1rsFD6dqz+X9i3axdlAj8MYKuIbBGRNIA7AByI8P7VOABgd+H73Ziuz0VORATAowCOquojc07FpX1dIrKm8H07gC8CeDMu7YtQKH07Nv8v7Nt1EvGbAV8GMADgLQB/1uw3Jwpt+gGAUwAymB5J3QVgHabfYR4sfO1sUts+h+k/xV8BcKTw78sxat+nAfy80L7XADxQOB6L9kX8s4hV345zvy60j327Dv/4SUwiokDxk5hERIFiAiciChQTOBFRoJjAiYgCxQRORBQoJnAiokAxgRMRBYoJnIgoUP8PAFLTTjGv0OoAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 432x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXAAAAC5CAYAAAAxiWT3AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAUqklEQVR4nO3df5BW1XkH8O+zv9hf4LKy4Iqki0gc/LnGBTV2GqKi1NhIEpyJHRvaYWo60RnN2FaSdNpkxmZM1GBmYjODlZE6Ma2OWqnDRCnVWKslLAYURX6KsLCyCwuyLO6yP57+sRe75567vO++73vvex/2+5lh3j2Hc9/77PJwuJzznnNEVUFERPaUFDsAIiLKDTtwIiKj2IETERnFDpyIyCh24ERERrEDJyIyKq8OXEQWisg2EdkpIssKFRRRsTG3yQLJ9XPgIlIKYDuABQDaAGwAcLuqvl+48IiSx9wmK8ryuHYegJ2quhsARORfAdwKYNQknzJlijY1NX1WfrfjoNdmwr6ePEKi8awXPTipfVKAtxpzblfIBK1ETQFunW4DDRHfY+gZUCKeCQcqM7dpnHzEKXd8PNlrUzLgXjhU5v9xy2D4miGvzVB5aPAhIh4ZdCsHK/17lfa6bSTqgTh0e42Keci9TsVt09t7BP0ne7wL8+nApwPYN6LcBuCq013Q1NSE1tbWz8ozf/6I1+aC7/5vHiHReLZe1xXqrcac25WowVVyfaHun1qdt13j1ZX0u+XSPv+6rotD1wz4bX6w+Fmn/NiPb/PaVHa5vXNvfanXpqLb7TEru056bXrOmeCUS0/6HW95txvkJ7MqvDZ1O9z3Lun3/7Eo7XXfp+/sSq9Nebf7QxysdL+v1vW/8K4B8hsDj3rS8X4KInKniLSKSGtnZ2cetyNKzJhzux8RvRZRzPJ5Am8DMGNE+TwAB8KNVHUFgBUA0NLS4vwl+PCe+7w3nQn/qTyT8fTU/vKBTU75pnObixLHGW7MuT1J6sfFpkKfTss8QlXa69c1zd3nlA/3VHttvjXpkFN+aGrUvdwn008botq4z6WlvX4311/jXjdY4b9PSb97r746v81Ajdum5GREPKHH5L46/38NXny17kVRwy4Rbz0mGwDMFpGZIlIB4JsAVufxfkRpwdwmE3J+AlfVARG5G8DLGP5ncaWqvlewyIiKhLlNVuQzhAJVXQNgTYFiIUoN5jZZwJWYRERG5fUEHofwxOaCEv+jRERUHP21/sfkZNCdYAt/5jvKkcO1GdtUHPPnhUv73LoJXf515SfcGMt6B702Fd2hScKSqElM932iJme9zyZJxGRj+HPgEY/N4c+za5arGfgETkRkFDtwIiKj2IETERmVujHwsLVDz3p1HBcnKo5JO/3B2aFyt66k3x+73tXY4LYp88fSwwaq/HuVn3Dfu2+y36YitGVI1Ph2eMy5rNePOfx9VHRHjMmHxtfDZcDfi6W8x//ey4+H9hYQt2sO75Xy2XtH1hIRUeqxAyciMoodOBGRUezAiYiMSv0kZpTwxGah9hXfufzqgrxPrsI7DRKlTfUi/xCWsP37zvbqPlywcsz3mvwVbwNI7P99o1OeOOew16Z9X51TPuv9CV6bo18I7ePd7XeFtR+51128eKvX5r1n5zjl8oiJzorjbt0ns/zn5to2d4fCE6GdGAfWF343QiIiKiJ24ERERrEDJyIyKq8xcBHZA6AbwCCAAVVtKURQY3WmnOwTPl2HY+LFk5bcTpvDb53j1YU3Z6rr8K/7u7mXOuUHpr6b8V71lf4B5/tDQ8xfb9rstVnZda1THqjyT8C5cGa7U9614XMZ49l6aJpXF95wKzzeDfgLgqoO+m0qj7gLgIbKQif9+OuDABRmEvPLqnooczMic5jblGocQiEiMirfDlwBvCIiG0XkzqgGPJWejBpTbvNUeiqGfIdQrlXVAyIyFcBaEflAVV8f2eB0p9ITpdiYcnu8nEpP6ZLvmZgHgtcOEXkBwDwAr5/+qmScCSf7hCc1KTlpzu1iipqAC0+wTfjEb/P0G190yi80Xua1+c4c98f77psXeG3O2uWWV77+Ja9NZbs7AVgdEfO2bdOd8qQDEbsahiYou3bVeW3OPRI+tcffabC0z60T9SdVK471uxWhkKN2eATyGEIRkRoRmXjqawA3AtiS6/sRpQVzm6zI5wl8GoAXZPgMuDIAT6vqbwoSFVFxMbfJhJw7cFXdDeDyAsZClArMbbLC5GZWuThTTvYJL+7hODklSSKGYsMn55Sc9NucNeOoU/7ny/7Fa3PlhAqn/HSzv3FW55C7mOa+69Z4bR596Ran3F/rxyNVoYF78bvCktAhOaW9/ji5lro/kKifT/jEooEJ/sh1Wblbd3KSWx4q5WZWRERnFHbgRERGsQMnIjKKHTgRkVHjZhIzSnhiM22TmtnsRhjVJptdDbOZ/OSEKYUdm+nXabm7UKVmr/9c+NDFzznl8IRllP+57Hmv7qLjdzjlu+r2eW2aFz/mlO/47V96bT688QmnPP/cRV6bj3ZPdcprFj7qtVnc/ddOufKw/72HJ0P7JvsTkqLlTvnE1NAk5ig9NZ/AiYiMYgdORGQUO3AiIqPG9Rh4WNRin6gT7zPJ9WSfXE7gyWZcOtex61yuy3W8nWzYfMfPvbofH7rSKT/zwRVemxur+726TM5/ZalXV/2Be1L8BXv+ymszWOOOyddt8bu5mXDfu7LWX31UdszddGpORbV/ryp35U7vFH98u7o93MZf7VN2wr1uqDzUIHodD5/AiYisYgdORGQUO3AiIqMyduAislJEOkRky4i6ehFZKyI7gtfJ8YZJVHjMbbIum0nMJwH8AsDI7cOWAVinqg+KyLKgfH/hwyu+JE/2ORMm+4x9D09iHOd2Lq58y59YPNlW45SrPvafC+fXL3LK7UcmeW2WzFnvlMMTlgBQ2xY6AedT/16DlW5d1WH/lJwT+92FREPiLyyqPOrOHC7edYPXpqbNLcugP0FZ1eXufKi7/RN5wjEOHnHvXTrKHHDGJ/DgHMCuUPWtAFYFX68CsCjT+xClDXObrMt1DHyaqrYDQPA6NUN7IiuY22RG7JOYInKniLSKSGtnZ2fctyNKzMjc7kdfscOhcSjXhTwHRaRRVdtFpBFAx2gNVXUFgBUA0NLSEn20siHZnOyTzYKcqLHiuBbyFEqcG2elSE65PUnqzed2NrZe+1TGNtds/oZX99ol/z7mex34Rp1Xt+atZqdccU631+b2Czc65af+84+8Ng9/1f0+FtUc99rc297ilB9tbPXaXPkn9U75WE+l16bn/dCRQJf6MfdsmeiU+ye5Y+L9/+1dAiD3J/DVAJYEXy8B8GKO70OUNsxtMiObjxH+GsBbAC4UkTYRWQrgQQALRGQHgAVBmcgU5jZZl3EIRVVvH+W3ri9wLESJYm6TdVyJSURkFHcjLIDwxObQx7O9NrlM5BVqorNQ4tz5kOzaO+BOAM5t2Jvxmoe6Znl1f1O/yym/svYLXpuz9rsLXAb3TPTa/Ns7853ylD3+Qp7vH/mWU/7u9AGvTfVet3t85i92eG1ObJzilMsGvSaY+JE7v32orsZrU93jlkt73Wfr8Kk+n9VHVxMRUdqxAyciMoodOBGRUaKa3PqDlpYWbW31Pww/HoRP9sn11J60K+ZCnvW6Dse0a5SzS+I1XnI7zs3csrH76WanXLKrymvTMPegUz64eZrXZrDWHReffdd6r82sDe6inH+a7v+dLXZu8wmciMgoduBEREaxAyciMoodOBGRUVzIk5DwyT4z8cgoLf+fxYnOQk3q7Fx+tVdn8edBhXX+n24a8zWDT+Z2Kt6uub1O+SY05/Q+ceITOBGRUezAiYiMyvVU+h+KyH4R2RT8ujneMIkKj7lN1uV6Kj0ALFfVhwse0TgRHhMHir9IIk0SGu9+EsxtU7pe+rxTPr5hitem72x3R6ma9/1T4CVi06mwPQ9c45Rvu+UNr82GZv+9k5TrqfRE5jG3ybp8xsDvFpF3gv+G5jbNS5ROzG0yIdcO/JcAZgFoBtAOjP6ZOJ5KT8Ywt8mMnDpwVT2oqoOqOgTgcQDzTtN2haq2qGpLQ0NDrnESJYK5TZbktJBHRBpVtT0ofg3AltO1p+yET/YJ72AIpH8xSzF3IywE5na61d+y3S1j+ygt8/e5a9qc8gNT3/XaFHtxT8YOPDi5ez6AKSLSBuAfAMwXkWYACmAPgG/HFyJRPJjbZF2up9I/EUMsRIlibpN1XIlJRGQUN7NKsajFPmnfBMvSeDfR6ZRcv88pZzPefeg/Pu/VTas97pQHv3wgr7hG4hM4EZFR7MCJiIxiB05EZBQ7cCIioziJaUx4YpM7GBLF48DfftEpf+m2jV6b3/z2Cqdc/Zr/THyg390xcRr8SczwzofnXuW20e9URMbIJ3AiIqPYgRMRGcUOnIjIKI6BGxfeAAuI3gQrk7RvkhUlvHHWvJtOFCcQOiOd+9M3nfKOn/ptZqEwf29KLnQX+7x68YtOeV7l0ejrCnJ3IiJKHDtwIiKj2IETERmVsQMXkRki8qqIbBWR90TknqC+XkTWisiO4JVnB5IpzG2yLptJzAEA96nq2yIyEcBGEVkL4M8BrFPVB0VkGYBlAO6PL1TKlsXFPlEn+YTFsNMhc3uMoibNw/mVTZsz1d5nL/Xqtl77VMbrvr4ztyP5Mj6Bq2q7qr4dfN0NYCuA6QBuBbAqaLYKwKKcIiAqEuY2WTemMXARaQJwBYD1AKadOjsweJ06yjU8uZtSj7lNFmXdgYtILYDnANyrqseyvY4nd1PaMbfJqqwW8ohIOYYT/Feq+nxQffDUCd4i0gigI64gKT8WxiRzGd8OX7NdD4/5PZjbVEiyeaJXd37PUqdcXtXvtSl/u9Yp373YfY7Y298Veb9sPoUiGD7odauq/mzEb60GsCT4egmAF8PXEqUZc5usy+YJ/FoAfwbgXRHZFNR9H8CDAJ4RkaUA9gJI1yMdUWbMbTItYweuqm8AkFF++/rChkOUHOY2WceVmERERnE3wnEqPLGZyw6GgM1dDIniMuOBNzM3ysKOn7jlXtXIdnwCJyIyih04EZFR7MCJiIziGDgB8DfAAtK32IfSKWqhGI3N9sfnOuX/unG5U170le7I6/gETkRkFDtwIiKj2IETERnFDpyIyChOYtKowpNTnNQkikfVnnKn/NW373TKu088Hnkdn8CJiIxiB05EZFQ+p9L/UET2i8im4NfN8YdLVDjMbbIun1PpAWC5qj4cX3iUJlELNnLZBCtFG2Axt8eI8yDxmPGPp98Ea5/2RtZnsx94O4BTB7x2i8ipk7uJTGNuk3X5nEoPAHeLyDsislJEJhc6OKKkMLfJonxOpf8lgFkAmjH8FBP5f2kRuVNEWkWktbOzM/+IiQqMuU1WZdWBR53craoHVXVQVYcAPA5gXtS1qrpCVVtUtaWhoaFQcRMVBHObLMs4Bj7ayd0i0hiMIQLA1wBsiSdESrPwLoaWJrmY22MXNZEd/jPPZnfCqDzhwrGxy+dU+ttFpBmAAtgD4NsxxEcUJ+Y2mZbPqfRrCh8OUXKY22QdV2ISERnFzayooLIZIyWiwuATOBGRUezAiYiMYgdORGQUO3AiIqM4iUmxC09s5rKDIZCqXQzHrWwmpDlpnRw+gRMRGcUOnIjIKHbgRERGcQycEhfeAAvguOl4k82GV7leN55yiU/gRERGsQMnIjIqm1PpK0XkdyKyOTi5+0dBfb2IrBWRHcErj50iU5jbZF02T+B9AK5T1csxfMTUQhG5GsAyAOtUdTaAdUGZyBLmNpmWzX7gCuB4UCwPfimAWwHMD+pXAXgNwP0Fj5DGhWKcxsLcJuuyPROzNDixpAPAWlVdD2DaqWOngtepsUVJFBPmNlmWVQceHPDaDOA8APNE5JJsb8CTuynNmNtk2Zg+haKqRzH838mFAA6KSCMwfAgshp9goq7hyd2UesxtsiibU+kbAPSr6lERqQJwA4CfAFgNYAmAB4PXF+MMlMaXqAUbmTbB6ntkbJtdMbeLZzwttolTNisxGwGsEpFSDD+xP6OqL4nIWwCeEZGlAPYC4J8IWcPcJtOy+RTKOwCuiKg/DOD6OIIiSgJzm6zjSkwiIqPYgRMRGcXdCMmM8C6G4Ymww9qTZDhUYLnuUFiI97U6qconcCIio9iBExEZxQ6ciMgojoGTWeGxTRHZWKRQiIqCT+BEREaxAyciMoodOBGRUezAiYiMkuFDSRK6mUgngI8ATAFwKLEbFwZjjl++8f6BqhZlX1fmdqKsxQvElNuJduCf3VSkVVVbEr9xHhhz/KzFG8Xi92AtZmvxAvHFzCEUIiKj2IETERlVrA58RZHumw/GHD9r8Uax+D1Yi9lavEBMMRdlDJyIiPLHIRQiIqMS78BFZKGIbBORnSKyLOn7Z0NEVopIh4hsGVFXLyJrRWRH8Dq5mDGOJCIzRORVEdkqIu+JyD1BfZpjrhSR34nI5iDmHwX1qY35dJjX8bCW20nndaIdeHB47GMA/hjARQBuF5GLkowhS08CWBiqWwZgnarOBrAuKKfFAID7VHUOgKsB3BX8XNMccx+A61T1cgDNABaKyNVId8yRmNexspbbyea1qib2C8A1AF4eUf4egO8lGcMYYm0CsGVEeRuAxuDrRgDbih3jaWJ/EcACKzEDqAbwNoCrrMQcip95nVz8ZnI7ibxOeghlOoB9I8ptQZ0F01S1HQCC16lFjieSiDRh+KT19Uh5zCJSKiKbAHQAWKuqqY95FMzrBFjJ7STzOukOXCLq+DGYAhGRWgDPAbhXVY8VO55MVHVQVZsBnAdgnohcUuSQcsW8jpml3E4yr5PuwNsAzBhRPg/AgYRjyNVBEWkEgOC1o8jxOESkHMMJ/itVfT6oTnXMp6jqUQCvYXh81kTMIczrGFnN7STyOukOfAOA2SIyU0QqAHwTwOqEY8jVagBLgq+XYHgsLhVERAA8AWCrqv5sxG+lOeYGEakLvq4CcAOAD5DimE+DeR0Ta7mdeF4XYWD/ZgDbAewC8INiTzSMEuOvAbQD6Mfw09VSAGdjePZ4R/BaX+w4R8T7hxj+L/s7ADYFv25OecyXAfh9EPMWAH8f1Kc25gzfD/M6nphN5XbSec2VmERERnElJhGRUezAiYiMYgdORGQUO3AiIqPYgRMRGcUOnIjIKHbgRERGsQMnIjLq/wDLpZJ2BZR+4AAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 432x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "validate_contact_maps(all_contact_dict, 1)\n",
    "validate_contact_maps(all_contact_dict, 13)\n",
    "validate_contact_maps(all_contact_dict, 14)\n",
    "validate_contact_maps(all_contact_dict, 333)\n",
    "validate_contact_maps(all_contact_dict, 26017)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_keys(['num_atoms', 'adj', 'is_contact', 'idx_contact', 'num_contact', '3d_dist_contact', 'path_len_contact', 'cxsmiles', 'smiles'])"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "all_contact_dict[0].keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_cxsmiles = [cxs[\"cxsmiles\"] for cxs in all_contact_dict]\n",
    "df = pd.DataFrame({\"cxsmiles\": all_cxsmiles})\n",
    "df.to_csv(OUT_PATH, sep=\"\\t\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "3378606it [07:45, 7253.59it/s] \n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "DONE! :)\n"
     ]
    }
   ],
   "source": [
    "# Make sure that `cxsmiles_to_mol_with_contact` works well on all molecules\n",
    "test_df = pd.read_csv(OUT_PATH, sep=\"\\t\")\n",
    "graph_contacts = Parallel(n_jobs=-1)(delayed(try_read_cxsmiles)(\n",
    "    cxs, ii\n",
    "    ) for ii, cxs in tqdm(enumerate(test_df[\"cxsmiles\"])))\n",
    "\n",
    "print(\"DONE! :)\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "num graph nodes 30\n",
      "num atoms no Hs 18\n",
      "num atoms 30\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAIAAADCEh9HAAAABmJLR0QA/wD/AP+gvaeTAAAbz0lEQVR4nO3daVgUV9oG4Ldpmk1EQcCgqAiiCAEDiIiSmIQQF8BEBUUTktGARvxijEZAEyXqTAJxGRw1ZlTccEUMgwqoTRC3kWEVF8JiRAUUEZFGtga6z/ejYg9DlB26gef+VVV96vDWdXk9ntpO8RhjBAAAbaUk7wIAALo3xCgAQLsgRgEA2gUxCgDQLohRAIB2QYxC8x49elRaWsotSySSrKws+dYDoFAQo9C8kJCQEydOcMtlZWUuLi7yrQdAoSBGAQDaRVneBUD3kJOTk5CQQETl5eXyrgVAsSBGoUVu374tEAiIqKamRt61ACgWxCi0yIwZMxYtWkRET58+PX36tLzLAVAguDYKbZGenv7bb7/JuwoAhYAYheaZmZkNHTqUW1ZRUbG1tZ08efJbb72VkpIi38IAFAEPMzxBa4nF4rlz50ZGRvbp0ycyMtLZ2VneFQHIE0aj0GqqqqonTpyYP39+ZWWlm5tbRESEvCsCkCfEKLQFn88PDQ396quvxGKxp6dnaGiovCsCkBvEKDTl7t2733zzjWx1zZo1ubm53DKPx9uyZUtQUJBEIvHx8dm0aZOcagSQM8QoNEUkEl27dk22mpiYWFZW1rCBv7//9u3beTzeypUrAwICurxAAPlDjEJ7LVmyJCwsTCAQBAcHL168WCqVtnzf4mJ6Mbql2lpqyzNUV6/SO+/QhAk0YQIdOdL6/QHaC4/fQzPS0tImTpzILd++ffulbebNm9e3b985c+b8/PPPT58+DQwMtLCwaEnnx46Rnx9lZNCoUfT4MXl5UeueoXr0iD7+mM6do5Ej6elTeu89GjyYJk1qTRcA7YXRKDTDxsbm8gt2dnZPnjzZuXOnWCxu1Iy7Za+pqRkREWFpaenm5paYmNiS/t95h778sq3FRUTQrFk0ciQR0YABtHw5HTzY1r4A2ggxCs1TeoGIDh486OvrO2zYsODg4KqqqobNDAwMKioqdHR01NTUzpw54+Dg8N5778XHx7+0z+fPnxcUFBDRpEmkqUnHjrWpssJCGjLkv6vDhlFBQZs6Amg7xCi0ztixY8eMGfP48eOAgAATE5MtW7ZUVlZyP929e5eIJk6ceP/+/cDAQG1t7V9//dXJycna2vrgwYMSiaRhP5mZmXFxcdzyli20Zg1xU0c9eEAVFS2u5rXXqKjov6uPHpGBQfuOD6D1GMCrVVVV5eTkyFZzc3MrKysZY0KhcNy4cdw/IV1d3cDAwLKysh9//JGIli1bFhYWtmnTpkePHi1btkxXV5drZmFhceDAgbq6uob9b93KfviBMcaCgti8eczWlrm4MC0ttnAhy8pqQX137jATE/bkCWOM1dSwt99mp0934OEDtARiFNpOKBSOHz+eS8kBAwaMHTuWiLZs2WJkZEREmpqaampqGhoafn5+I0aM4JoZGRmFhIRUVVVxPchiVCxmFhbMxoZNmsSIGBHj89mMGSwh4dV//rvv2KVLLDycWVqyqVOZldUffQF0LcQotNf58+fffPNNLiV5PF5wcPDly5ddXV1lZzx8Pv+nn346cODA6NGjuS36+vqBgYHPnj2LiWE//cQyMphYzC5fZv7+jDGWmso++YSpqv6Rp2+8wQ4dKqmpqfmfv5qSwng81qcPe/SIJSay0lImlcrl8AEQo9AxLly48Pbbb6uoqGhoaJw9e5Yx1ihMJ0yYkJmZeerUKdnVAC0traVLl3p7PydiGzc27vDxYxYUxAwNGRF7882F+vr6/v7++fn53K+XfH2lWlrMz4/94x+MiC1f3sXHCyCDGIUOU19f7+PjQ0QqKionTpzgNmZkZFhZWRER0WAe7/9cXV2Tk5PPnj076cXTnXy+so6OrVB4/aV91tSwAwekEyY4co1VVFS8vLz27dtHRJaGhhUFBZIRIxgRi4rqwgMF+B+IUehIUqn066+/5k7k9+zZI9seGLiNz68kYkSreTyeq6trUlJSamqqh4eHiopK//79p0+f3ujuUyMXL16cNWsWn8+XDW/nzJmzefPmkTo6qV5eOKMHOUKMQscLCgrirpNu3rxZtvHgQaaszIiYispOIt62bdu47TExMf369SMiT0/PppOUMVZYWBgYGKijo0NELi4umpqaRBQTE9OJBwPQHMQodIqQkBAej0dEGzfukm08fpypqDAiZmeXWllZJduekpKira1NRB4eHs0mKWPs+fPn3377rZKSEp/P//DDDzvlAABaDDEKnSUsLMzEZLSeXtH//d9/z7ljYpi6Olu6tHHjlJQUbozp7u7ekiRljPn7+xORoaFhSUlJhxYO0DqIUehEJ0+KueGntzerr/9j42+/vfxKZmpqaquStK6uzsHBgYhmzpzZoVUDtA6+xQSdKz6ePviAKiroww/p2DFSVW2qcVpamrOzc2lpqbu7+9GjR5WVm5mB7MGDB9bW1qWlpTt37vz88887sm6AFkOMQqdLSqKpU6m0lKZOpZMnSV29qcYNk/TIkSMCgaDpziMiIjw8PNTU1BITE8eMGdORdQO0DKYmgU43bhzFxZG+PsXG0uTJJBI11djGxkYoFOro6ERERMybN6+urq7pzt3d3b29vWtqaubNm9doximAroHRKHSRrCxydqbKSvr0U7KwIG9vIqJff6XiYpo7t3HjVo1Ja2pq7O3tb9y44ePjs2vXrk47AoCXw2gUuoiZGV2+TLGxlJtLa9bQ778TEd29S7duvaRxwzHp3Llzmx6TqqmpHTlyRF1dfffu3UePHu2c8gFeCTEKXcfIiOztiYi++oqWLGmmsY2NTVxcnI6OzsmTJ5tNUgsLC+7TpIsXL87Ly+uwigFaADEKcvD++6SuTsePN9PM2tq65Unq6+s7Z84ckUg0Z86cZq+oAnQgxCjIx9attHYtcRPnnz9PL2bQb6xhknJvizbR588//zxs2LDk5OTAwMC2VZWamtrwssA333xTU1PTtq6g90CMgnwMHUrz59M//kEiEbm5kZERBQfTSyPL2tpaKBQOGDDgl19+aTpJ+/fvf+jQIWVl5eDgYKFQ2IaqcnNzL168KFsNCwurra1tQz/QqyBGQW6WLyc1NRKL6Y03qKSEAgLIzIz276f//WgTMcYCAwNnzpypra39yy+/zJ49u7q6+lV9Ojo6rl27ViqVenl5FTX8TFMLBAcHY+wJbSHfl6igF8rNZZWVfywXFrKCAiaVsn/9i73++h/T3ZuZsX/9q0j64o3RkJAQItLX1z979qxAIDAxMTExMUl49ddFJBKJk5MTEU2ZMkXamgn0pkyZsmzZMhMTk9kvaGhoiESidhwr9AqIUVAUEgkLD2empozHk1pYjHv99dfDw8MzMzPV1dWJKCoqaunSpUSkqqpKRHw+f8WKFbJvOjVSUFDAfUpv06ZNTfxFkUgUFxcnW925c6ejo+NHH31074VBgwYhRqFZiFFQLLW17MCBvMGDB3NnSw4ODtOnT/f29hYKhTweTyAQXLt2LSgoSEVFhYiMjY1fNSyNiYmRtX/V3yoqKtLW1haLxdxqYWFhnz59fHx8ZA2GDBmCGIVmIUZBEVVVVW3atEn2cWYnJ6fXXnuNiL7//nuuQUZGhrW1NRHxeLyFCxdWVFT8uRNu9GpiYtIwCquqqoqLi2Wr48ePFwqFstURI0a4urrKVhGj0BKIUVBcFRUVQUFB/fv3JyI1NTVjY+N62XR7jNXW1jYcll64cKHR7jU1NVzUzp49W7YxODjY19dXthoSErJr138nlv73v/+dlJQkWxUKhS2c/BR6M8QoKLqSkpIlS5Zwk+b97W9/a/RrRkaGjY2NbFj6/Pnzhr9mZ2draGhoaGjk5uZyW/Ly8sLDw7uodOgdEKPQPYSFhXFJ6u/v3+j+e8Nh6fDhw+Pj4xv+OnDgQB6Pt3r16q6tF3oRPDcK3cPHH398+PBhgUDAnZVLpVLZTwKBwN/fPzk52cbGJi8vz8nJadGiRRUVFUSUk5PDXQk1NzeXX+3Q08k7xwFaITo6mnv+ad68ebW1tY1+raurazQsXbx4Mffv/P79+3IpGHoDzDcK3cylS5fc3NzKy8vd3NzCw8PV1NQaNUhPT58/f35GRoaSkpKSklJ9fX3//v2fPXsml2qhN8BJPXQzb7311q+//qqrq3v69Olp06ZxJ+8NWVtbp6SkBAUF8fl8DQ0NbsucOXPkUSz0ChiNQreUmZnp7Oz88OHDcePGxcbGcp8UbeQ///mPs7Pz8+fPzc3NL168KHsKFaBjYTQK3ZK5uXlCQsLQoUPz8/MXL14sevGBp3Pnzu3Zs4dbtre3t7e3J6LMzMzNmze3sOdbt275+PjIVhcsWJCVldWhtUNPgxiF7srU1PTy5ctCoTA9PV0sFnMb8/PzG6be3bt3iUhFRSUoKGjr1q0t6ba6uvrevXuy1Xv37jUxoRQAIUahWxs6dKiFhcWrfi0vL8/Ly1NTUwsNDeXxeMuXL4+IiOjK8qCXUJZ3AQAdwMXFhXs4v7i4eMaMGdzG9PR0xpilpeXHH39cUFCwatWqjz76SFtbm5tGrwnJyckODg7ccmZmZqdWDj0AYhR6gujoaH19fSLas2eP7KT++vXrRPTGG28QUUBAQFFR0datW2fNmnXp0iUrK6smerOzs5NNnv/uu+92bunQ/eGkHnqshjFKRFu2bHF3dxeJRNOmTXvw4IFcS4MeBTEKPVajGFVSUgoLC3vzzTcLCwu9vb1fuktaWlrD10wBWgLPjUK3l5WVNWLECO7aaGlpqVgsNjAwqK2t7du3b319vUgk0tTUlDV+9uzZggULPDw8KioqFi5cyG38y1/+smvXrqSkJGdn52nTpoWGhnKz8xFRRUWFuro6n8/v+uOC7gKjUej2zMzMuAwlIh0dHQMDAyK6fft2bW2tqalpwwwlIm1t7cjISIlEcvPmTdnG8+fP5+bmzpw5s6amRldXV5ahRKSpqYkMhaYhRqFnanRG3zSpVDpjxownT564uLjs2LGjk0uDngZ36qFnajZGT548mZ6eTkRSqbS4uPjx48e2trbHjx+XDWwBWgijUeiZmo3RmTNnXrx4MSEhwcjIiDE2bNiwM2fO9OnTpwtrhB4C//FCD8QYy8jIoCZjlMfj8fn8r7/++ujRozweLyIigvtqHkBrYTQKPVBaWppIJNLQ0IiMjLx27VplZeVLm+3evXvz5s0CgUBbW7uJl0oBmoYHnqCnqaqqcnJyys3Nffr0qWyjgYGB7Qvjxo0TCASnT5/29vaWSCT79u2zsbF5/fXXeTyeHMuG7gsxCj2KRCLx8PCIjIw0MDD4/PPP7927d/369Vu3btXV1TVsNnjw4JKSErFYvG7durVr18qrWugZEKPQczDGfHx8QkNDdXV1L1++bGZmxm2vr6/Pzs5OTU1NTU3NzMxMS0srLS0dNmyYra1tREQEBqHQTohR6DlWr179ww8/aGhoCIXCCRMmvKqZVCq1sLDIysq6cuXKxIkTu7JC6JEQo9BD7Ny509fXVyAQREVFTZ069c8NampqPDw8xo0bt2LFin79+jHGRCIRnnCC9sOdeugJoqKivvjiCx6P989//pPLULFYvHHjxoaXRNPT08+cOXPixIm0tLT6+npLS0tkKHQIxCh0ewkJCZ6enhKJJDg4eP78+UQklUo//fRTPz8/2eQjRJSUlERE48aNky3Iq2DoYRCj0L3dvHlzxowZNTU1vr6+K1eu5DauWLHi+PHjWlpaS5culbVMTk4mIjs7O9mCXAqGngcxCt1YXl7e5MmTy8rKPD09t23bxm384YcfQkJCVFRUIiIirK2tZY25QaidnR1Go9CxcIsJuquSkhJHR8fs7Ox33nknNjZWVVWViA4dOvTJJ5/weLxjx455eHjIGpeVleno6Kiqqubl5Q0aNEhdXV0kEmEWEugQ+GcE3VJVVdX06dOzs7OtrKwiIyO5DI2Ojp4/fz5j7O9//3vDDCWipKQkxpiNjU1aWhpjzNbWFhkKHQUn9aAo7t+/f+vWLdlqTEzMq1rW1dW5u7tfu3bN2Nj43Llz/fr1I6KkpKQ5c+bU19d/++23X375ZaNdcH8JOg9iFBRFXFzc/v37ZateXl4v/SwSY2zhwoWxsbF6enqxsbHctEx37txxc3OrrKz08vJav379n/fC/SXoPIhR6Gb8/Pz279/ft2/f2NjYkSNHEtHDhw+dnZ2Li4tdXV337t370pc7ZemZkpJCGI1Ch8LlIVAgt27d2rt3L7csFouvXLmirKw8atSoAQMGcBt37NixadMmgUBw4sQJW1tbIiovL3dxcbl37569vf2xY8deesUzPz//0aNHOjo6fD6/uLhYT09v+PDhXXZQ0OMhRkGBMMYkEolsdc2aNZcuXSIiXV1dMzMzNTW1+Ph4JSWlAwcOTJ48mYhqamrc3NyuX79ubm4eExPzqreSZI86cWNSDEWhYyFGQYFYWlr6+PhwywEBAVZWVlVVVdnZ2SUlJVeuXCGiQYMGLVu2bO7cuVwbf3//S5cuGRoanj17VkdH51XdFhcX9+nTZ+zYsbgwCp0B10ZBcW3dujU5Obm8vLygoODw4cNEJBaLZa8qEdHq1audnJzOnj07ZMiQJvpZvHixSCQKCAiQDUs7u3LoVRCjoCjMzc0bTlvn7e0tu1k0ePBgFRUV+tP5+MCBA+Pi4lry/Q8+n6+urp6WlkZEY8eOlW1ftmwZF9BEVFhY2MIPMgM0hJN6UBQODg4NV4ODgxuupqam0v8mYGslJCRUVlZqampu377d1NR05MiRI0aMkEqlsseqGl2ZBWghxCh0D1yMcnfn26C8vHz58uW6urolJSUbNmyQbZ8+fbqlpWV5eTkRVVRUdEip0NsgRqEbYIxx5+Nti9G6urrZs2ffuHHDyMho3bp1RUVFuS/069dv27ZtERERRCQWizu4bugdEKPQDeTl5T19+nTgwIGGhoat3ZcxtmjRonPnzunp6QmFwhEjRjT8denSpStXrvTy8iKigoKCl06bD9A03GKCboB79ahtd9i/++67ffv2aWhonDp1qlGGAnQIxCh0A22+MLp3797169fz+fwjR46MHz/+zw20tLTU1dW5ZT6fr6ur285SoRfCfKPQDTg5OcXHx586dcrNza3le8XHx0+dOrW2tnb79u1LlizpvPKgl0OMgqJjjOno6JSVlT18+NDAwKCFe926dcvR0VEkEn3zzTd//etfO7VC6OUQo6DocnNzR44cOWjQoMLCwhbuUlhY6ODgkJ+f7+npeeTIkZfO+QTQUXBtFBRdax+8Ly8vnzZtWn5+/qRJk/bv348Mhc6GGAVF16r7S3V1dbNmzbpx44a5ubns4yIAnQoxCoqOe9rJ1ta22QtQjLHPPvssLi5u0KBBsbGx2traXVIg9HZ4/B4UGmMsPT2dW+jXr5+VlZWtra2tra2jo6OxsXGjxqtWrQoLC+vbt290dPTQoUPlUS/0RohRUGg5OTkikWjIkCEPHz58/vz51atXr169yv00ePBgOzu71atXc4/l7969Ozg4WCAQREREYKIm6EqIUVBo3Oz3enp6jo6OBQUFaWlpqampqampiYmJhYWFhYWFfn5+RBQdHe3r68vj8Xbt2vX+++/Lu2roXfDAEyiuJ0+e2Nvb19fX5+fnE5GmpuaYMWO4k3obGxtlZeXk5GQPD4/bt29PmjSpsrJy/fr1a9askXfV0OsgRkFBiUSit99++/r168bGxlZWVmlpaQ8ePGjYYODAgXZ2dqampmFhYSUlJQsWLAgNDZVXtdCbIUZBEVVXV0+ZMuXSpUumpqaXL18eOHAgEZWVlaWkpFy5ciU1NTUpKam4uJhrrK+vb25ufu7cOW6GfIAuhhgFhVNXVzdjxozo6GhDQ8MrV64MGzbspc1+//335OTkBQsWVFdXZ2VljRo1qovrBODgFhMoFsbYwoULo6OjdXV1z58//6oMJSITExNVVdXq6uoBAwYgQ0GO8Pg9KJbly5fv379fS0srNjZ29OjRTTfOyMggIjzeBPKFGAUFsnbt2pCQEBUVlYiIiJa8RH/9+nUiGjNmTOeXBvBKiFFQFDt27NiwYQM3xbKzs3NLduFGo4hRkC/EKCiEyMjIL774gsfjhYaGzpo1q4V7IUZBESBGQT62bt16584dbjknJyc3N3fChAkbN2789NNPW9hDVVXV77//LhAImr2ECtCpcKce5EMoFI4dO5b7xlxRUdHVq1cvXLggEAha3sPNmzclEomFhQUeFwX5wmgUFEWrMpRwRg8KA6NRkJtVq1bp6OgQ0dOnT7mFVkGMgoJAjILc+Pn5cXPcJSYm7t27t7W7I0ZBQSBGQW60tbW5l+XbME09Y+zmzZtEZGVl1fGVAbQGro1Ct5SXl1deXm5gYKCvr09EoaGh0dHR8i4KeimMRkE+NmzYMHz4cG7Z0tLyu+++a9Xu3PtLstdAc3Nz6+vrO7RAgJZCjIJ8WFtby5a1tbVbe16PC6OgOHBSD90SF6MnT550cHBwcHAICwuTd0XQe2E0Ct0SF6NRUVHcK0wBAQHyrgh6L4xGofspLy+/f/8+j8czNTWVdy0AiFHoburr63fu3MkYU1JSUlbG6RTIHz4iAt3G7du3w8LCDhw4UFRUpKurW1VVlZWVNWTIECJ68uSJQCDo37+/vGuE3ggxCoouPz//8OHDhw4dun37NrfFzMyMiLKysqytra9cuaKhoSHXAqG3Q4yCPEkkEiUlJR6PR0SMMalUyufzuZ+qq6vPnDlz8ODBs2fPcs+Eamtre3h4eHl5TZw48dmzZ/b29nfu3HF3dw8PD+d6AJAPBiA/Tk5OycnJ3PL58+c9PDwkEolQKPTy8tLU1OT+iaqqqrq6uoaHh9fW1jbcNzMzU0tLi4h+/PFHedQO8AdcoQcFIhaLBw8eXFRURERKSkqTJk3y8vJyd3fv16/fnxuPHj364MGDM2fODAgIMDc3d3Fx6fJ6AYhwpx7k7tmzZ8XFxcXFxWVlZaqqqvr6+mZmZoGBgTk5OQkJCZ999tlLM5TzwQcfrF27ViqVzps3LzMzsyvLBpDBtVGQp/fee6+uro67w/7kyRNDQ8OffvpJV1e35T0wxjw9PcPDw0eNGpWYmIib9dD1MBoFOdu8eXNUVFRUVNS6deuIqFUZSkTcV/AsLS2zs7M9PT0lEknnlAnwSohR6PY0NTVPnTqlp6d37ty5NWvWyLsc6HUQoyBPAwcOVFVV5ZbV1dX19PTa1o+RkdGxY8eUlZWvXr1aV1fXcQUCNA/XRqHniI+PNzAwCAsL+/7777ktq1at8vb2NjExkW9h0LNhNAo9x7vvvltVVZWUlCTbkpSUJBKJ5FgS9AaIUQCAdsHj99DTpKSkODg4cMt4mBS6AGIUepqxY8fGxcVxy05OTvItBnoDnNQDALQLYhQAoF3wwBP0KNXV1Y8ePTI2NuZW7969a2BgoK6uLt+qoGdDjAIAtAtO6gEA2gUxCgDQLohRAIB2QYwCALQLYhQAoF3+H2x+Ckz2JN34AAACXnpUWHRyZGtpdFBLTCByZGtpdCAyMDIxLjAzLjIAAHice79v7T0GIOABYkYGCJADYgUgbmBkA9MsbA4aQIqZeFphAYhmJKiOQQVkLRIfQrND+MzsCitANBMjB0SCiRFMMzLSiuZmEGJgFGVg4sxgYhYHeiCDiYULiJkSWCUZWHkzmNhYE9h5GDi4M5g4GRM4GRi4mBO4eRO42Rl4ZFmYePgYeLgYeAUU+AQ1mPjZMpj4ORIE+BSEGRhEGBjEmBgkWBik2Bik2RlkOBhEmNkYOYGGM7OxsvFzcPOysXPzCvDxiDPCokFu6d75DhXcKw5YpDc4/I457CC01PHAOvdEh3OrJjrYzq488OXvF/uIU6ccXH593R/wR8dh/tkZDkbPjA6oPem29/1s5hB9eY79tpYn+zu+GAPF4+z95dwO1NrvdOg/FLp/Q1HEfhu/qQ5u2z7vE7ngcMDj4TIHf4fGA8tfeDj8WbnV4dOlp/uz9uyxTzSa7SBZHL7vlvSZ/W/09zoEefLun/hWxl61tMphXpyl/QKp/P3HvRc6OH5Utmd53mP/6VKuA8/klTZLdfIPHNlY58DP3WvPlbHILqB3pYPPskn29uHcDgqXljosvLbgwHrVRQ6eelsdFJIPAdXmAe2sdej+u/mAsXE1kL7scLLM7cAOuX4HL54yBzObqQf+tp+xX9D5wEH59sT9KWccHZZXtjt8aNU9oLtJ1u5aGAfQ/Z/t725ds5/9HKPDhAUL7O9Nzj8QVnvOIVXy1P74GUv2S7KscYg4NWl/hlLCgTjvew6HL2fv69XwtRcDALF2x6dRi6LQAAAC13pUWHRNT0wgcmRraXQgMjAyMS4wMy4yAAB4nJVW224UMQx936/ID5C1HTtOHqGLhIQol4fyiNpSCQRVgbYS8PU4iWcY0FZVRqPdnEl8xjm+TPZnN1/vr69u92/uL04+XV2/PTmc350/O7+9en/z48v+2/3FpT39fkmA+tFmLmxm//PX7z349aH9VLv2EO35LrTr3eHl57uwXumw24UEIVEI0G9cBn6bfTgjY+r2HGvFaoMnEkmQxzNAyuEk/Gd59O4sOSIINpYUgUS7J1HsLTMsHEXIWSpAGwWMFXmKJceUlBqL2RJ2XygqUJ3zRXXsyGyrpOEL1DkWikVKHrZE4l5pMb45FsTSRhCLgrrOVaZiJPbeCs3WWJIsIxY5xpIe1CVnKcOWNYP7gqRzvhAODyzXUsWRL5gqzbFkVXBNq+2j68zKR3f0cKQL1zp2RAg8+KTypLoVR+6CZXGvKItWxrTNXXqMxfIeEw9bJXa+muYqQCIwiHvAfUemCwKUGZYUFXt8jQVoyTpNiuF0hqVqzYsHiy4JrUKPsBwRaMmXWjy+yOI1jWosr2d0wbL0OqBMrlW2Hb2Yyro8WHIE5exake1ygsV0yaN6jI/YO2Ylq4oJlrzYWmRMXRj5zEoy50thllGNOSePlljgZljUukAuo3qskmUwA5UpdTlS6h60vouYRr6g8JQulhsJvGfbl8RrOnFNcyzmPXn3Fq5eAWwVOhUjFnJdxFrwGFGRKXUlJu0drqnLQ2f7wgJNqZujtTX1XucK2TcAcGJHGFr24wAUiFaQQstAHoAD8TrDvbR9RgLiBrRPjYMc7Nix2OTQTiM+ow0voISWF76sBlyp2+v/Abgs8zf6DG2om3VZl6V2dmogd4CymcG/bBzaucKB7aeM1mUgd195BXUFumGjrW+EW5C6IA6kC+RAO7WDsvHaziRhCckrOxE+PXR32oL2349A1Gaenx52fwBQFbAlH7LgzwAAAcZ6VFh0U01JTEVTIHJka2l0IDIwMjEuMDMuMgAAeJxdkr1qXDEQhV8l5RquxfyPxkvAsI2rJEVIs2zALO5srwku/fA5o02RpLmDPh0dnRnd48PpeDjxWc6748Pp5vVa/nzl+OV02H3+enM83N+f+Ar5H8nusOr6/IUZ308fuxjmMrdbHp6zusr02vtYKxpTfRVz3xtKLSpMts6UBXCEz8aWsd3qIJaEg6Z7i9hiNnYS3utIjo0GCWXD1OS9jMk8QWdeKZUHKMmUDYncamlNrbU+o6m4tH1OV1BWUtCiazK1UlxWrAbfFOMOWDAAzGoDJi7sKacgLRk5VmE433s0AaWm98o8N1yRS1ksy8x9nQ/WfQwMItdkOgYaITZII3NFLG8bS+shZjrOS9NOTCUFKqqxKHMbsBuge1+l3RV3c9zxpxnm2lPXbsPRTkflBUmLN8U0SnC+ChFvselsm/XDBKQ8r5QkZEMJPAGyRtMYlBZwSKnoWUW0NMQSsMTRK5OvVCTe0AVsCcAwVFxkuYSquZ6ohHt+Seg0kSLWD4eMvrXL5JvtJ9+hQ94e3y8v335d3u54vFyev1/efzw+P72en4be8f9IPn4Dn1isShuZbd4AAAAASUVORK5CYII=",
      "text/plain": [
       "<rdkit.Chem.rdchem.Mol at 0x7f3f816ead60>"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "print(\"num graph nodes\", graph_contacts[0][\"num_nodes\"])\n",
    "print(\"num atoms no Hs\", RemoveHs(mols[0]).GetNumAtoms())\n",
    "print(\"num atoms\", mols[0].GetNumAtoms())\n",
    "mols[0]"
   ]
  }
 ],
 "metadata": {
  "interpreter": {
   "hash": "906fb3602c4d49c4c01ec4a34d5abe4c7af3a32cf71a93ee4914804593d051b0"
  },
  "kernelspec": {
   "display_name": "Python 3.9.9 ('gtblueprint')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
