{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/home/philippe/Distill/mol-distill\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/philippe/.conda/envs/mol-distill/lib/python3.10/site-packages/IPython/core/magics/osm.py:417: UserWarning: This is now an optional IPython functionality, setting dhist requires you to install the `pickleshare` library.\n",
      "  self.shell.db['dhist'] = compress_dhist(dhist)[-100:]\n"
     ]
    }
   ],
   "source": [
    "%cd ../.."
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:22:01.914442137Z",
     "start_time": "2024-09-19T13:22:01.867181920Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "collapsed": true,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:22:28.700583471Z",
     "start_time": "2024-09-19T13:22:28.317804497Z"
    }
   },
   "outputs": [],
   "source": [
    "import os.path\n",
    "\n",
    "import pandas as pd\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "\n",
    "from tdc.single_pred import ADME"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Found local copy...\n",
      "Loading...\n",
      "Done!\n"
     ]
    }
   ],
   "source": [
    "data = ADME(name = 'Caco2_Wang')"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:22:38.032602050Z",
     "start_time": "2024-09-19T13:22:37.990371806Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "outputs": [],
   "source": [
    "df = data.get_data()"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:22:49.672071202Z",
     "start_time": "2024-09-19T13:22:49.669387416Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "outputs": [],
   "source": [],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:23:40.933463377Z",
     "start_time": "2024-09-19T13:23:40.928100613Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "N=C(N)c1cccc(CC(CC(=O)N2CCCC(C(=O)O)C2)NS(=O)(=O)c2ccc3ccccc3c2)c1\n",
      "C[C@@H]1NC(=O)[C@@H](C)NC(=O)[C@H](C)NC(=O)[C@@H](C)NC(=O)[C@@H](C)N(C)C(=O)[C@H](C)NC1=O\n",
      "COC(=O)c1c(Cl)cc(Cl)cc1-c1ccc([C@@H](C)NC(=O)C2(NC(=O)C(F)(F)F)CC2)c(F)c1\n",
      "COCN1C(=O)NC(=O)C(c2ccccc2)(c2ccccc2)C1=O\n",
      "CCOc1cccc(NC(=O)OCCN2CCCC2)c1\n"
     ]
    },
    {
     "data": {
      "text/plain": "<rdkit.Chem.rdchem.Mol at 0x7f3f73b06dc0>",
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAIAAADCEh9HAAAABmJLR0QA/wD/AP+gvaeTAAAf8ElEQVR4nO3de1zOd/8H8FcHV0o6i0KanJZQCiVkKOQwlsthWzbbLdu4M8Mv95gwtzls1Ox+jId7c1gOcznccmYsyzmhVCjHRBjpQF2lrvfvj2+7VGLVdfheV9f7+fDHvh9X1+d9tXr5Hj4HIyICY4yxujIWuwDGGNNvHKOMMaYSjlHGGFMJxyhjjKmEY5QxxlTCMcoYYyrhGGW1k56O5csrtezejT17RKqGMR3AMcpqJz0d331XqYVjlBk4jlHdlZub++eff4pdBWPsb3CM6hy5XL579+5BgwbZ2dk5Ojr6+PiUlpaKXRRj7JVMxS6AlZPL5QcOHJDJZLt37y4oKFC2JyYmjhs3LiYmxszMTMTyKnr0CAEBLw4zMjB8uHjVMCY2jlGRyeXyw4cPy2SyXbt25efnC43u7u5SqXTQoEFnzpyZO3futm3b7t69u3v3bnt7e3GrFVhZYeHCF4fLlolXCmM6gGNUHK9Jz3fffbddu3ZCi6+vb//+/YODg0+dOtWnT5/9+/e7uLiIV3U5iQS9e784/OUX8UphTAdwjGpVDdOzIg8Pj9OnTwcHByclJfn6+u7bt8/T01O7VTPGXodjVBtqlZ6PHj3auXOnTCZbu3Zt8+bNATg7O8fFxY0YMeLYsWO9e/fetm3bwIEDRfgYjLFqEdOYoqKi2NjY0NBQKysr5Tfc3d09MjLy6tWrVV78+PHj9evXDx06tEGDBsIro6KiKr5ALpePHTsWgEQi2bhxoxY/RyX379PBg5VaLl6kpCSRqmFMB3CMqt9r0jM9Pb3Ki19OTxMTE39//6ioqAcPHlR5sUKhiIiIAGBkZBQZGamlz1PZlSvk7U0bNrxomTGD1qwRpRbGdALHqNpoLj2riIqKMjY2BvDPf/6zrKxMYx+oeufPk4kJNWlCyjLfeYcWLNByFYzpEI5RNYiJiWnVqlWjRo2U6dmtW7elS5feuHGjyitVSc+Ktm/f3rBhQwAjRowoLCxU66f5G+fPk6UlffghjR9f3sIxygwcx6iqzp07Z2pqqrlzz1c5efKkMIzU19f3zz//VPlz1JQQo/fuUePG9PvvRByjzODxk3pVxcTElJaWWlhYHDp0yN/fv+Jf5eTk7NmzRyaTHTx48Pnz5/grPaVS6bhx4xwdHVXp18/P748//hg8ePDp06eFIaWtWrVS6ZPUhpMTIiPx6adIStJan4zpKI5RVQmnohMmTFBmqEbTsyJ3d3dhSOnFixd9fX337t3btWtXdb15RQoF4uMhk8HGBiEh5Y1Tp+KXXxAdrYkOGdMrYp8O672AgAAAe/fuFQ6PHj2qvMaXSCTBwcFr167NycnRXAEFBQXCMFJLS8t9+/ap8Z3Lyig+nsLDydmZAALIwYESEsjSsvwFf/xB1tbUqxdf1DODxjGqkrKyMuG5vPIW57Nnz6ysrIT7ng8fPtROGcXFxe+++y4AU1PTNSoPPno5PQFq1YrCwyk+nhITX8QoEX3wAQG0YAEpFKTFO7SM6RCOUZWkpaUBcHFxqdhYVFSk/UoUCkVkZCRUGFL6+vRUKMpfJjxiUnr0iOztacECmjOHnJ3pwgU1fBbG9AvHqErWr18PICQkROxCyn3//ffCkNKPPvro+fPnNfmSsrKyuLi48PDpLi4KZXq6udGsWZSYWNN+i4upd28CyMam/PE9Y4aDY1Ql4eHhAL755huxC3lh586d5ubmAN5+++1nz5696mVlZWXx8fHh4eHOzs7Cndxu3e6/fO5Zc3I5jR1LAEkkJN5U1QpKSqi0VOwimEHgGFWJn58fgMOHD4tdSCWnTp1ycHAA0L179yr3Z4Vzz8mTJzdr1kz5mNHNzW3WrFkXLlSdLFBbCgX93/8RQEZGJNJUVSIi2ryZ3N3J1JRMTKhHD4qLE68UZhA4RutOGC5qZGT0+PFjsWupKi0tTRhG6ubmlp6e/vK5J4BWrVqFh4fHx8cr6nDy+WpRUWRsTACFh5PWp6oSyWRkaUmbNlFREeXn07Jl1LBhLW5PMFZ7RkSk4SFV9VZSUpKnp2ebNm0yMjLErqUa9+7dGzJkyMWLF62trc3MzB4+fCi0u7m5SaVSqVSqoUGmALZvx/vvQy7HyJHYuBHm5hrqpzpeXhg+HPPnv2gZPRomJti8WYtFMMPCW9rVXUJCAoBu3bqJXUj1nJ2d4+Pju3btamlp+fDhQ+W5Z0ZGxjfffKO5DAUQEoL9+2Fjg5070a8fHj3SXFeVlZUhLQ1BQZUag4KQnKytCpgh4hitu8TERAA+Pj5iF1JJWVmZ8r8tLS29vLzu3r07ffr0W7duRUdH9+rVy8jISAtl9O2L48fh4oLTpxEQgNu3tdAnkJODkhI4OFRqdHREdrZWumcGimO07oSzUV2L0S+++MLV1XXHjh3C4fnz5wGMHDlS+5V07Ijjx+HhgfT00rCwj5M1d0qYnIyvvkJEBBwcYG6O+/cr/e29e9CBDaxYPcYxWkclJSUpKSnGxsZeXl5i11JJQkLC7du3ra2tAcjl8pSUFBMTE7G2b2rZEvHxGD8++tChn3v37n3kyBF1vntqKubNg7s7unTBwoX44QcUFsLTE7t2VXpZbCy8vdXZL2NViP2MS1+dPXsWgLu7u9iFVPL8+XNzc3MjI6MnT54Q0alTpwB06tRJ3KqUc1UlEskvv/yi6tslJdGcOdS+/Yu5Vk2a0KRJ9NtvVFpKhw6RhQWtXEkPH1JmJv3rX9S4Mb20dCFjasQrPNWRbj5fSklJKSoqatu2rY2NDYBz585BB247SCSSmJiYtm3bzp8/f/z48deuXZs3b16t3yU1FTIZtm7F5cvlLXZ2GDIEUikGDcJfC7kiMBD/+x8WLMCsWTA1Ra9eOH4cbduCCDNm4KOP0LGjuj4XYwKO0TrSkYSqokpVulOkkZHRvHnz7Ozspk2bNn/+/Lt37/7444/KpbBeIzk5WSaTjU1L6/jX3V44OmLkSEil6NsXJibVfE1gIAIDqzauWoXly/Hzz/jf/xAQoOLHYawSsU+H9VWnTp0AnDp1SuxCKpk0aRKA7777Tjh0d3cHcPbsWXGrqmjHjh01mauakpISGRnZoUMH4af0c09PsrOj0FCKjaWSkrp0LJfTmDHlk1U3bar7B2DsJRyjdfHs2TNTU1NTU1Mt74P0t7y9vQH88ccfRFRQUGBiYiKRSORyudh1VaKcq9qjR48qc1WTkpLmzJnTvn175T/zjo6On3zyye9HjqhhgrxCQTNn6sBkVVbfcIzWxfHjxwF4enqKXUglcrnczMzM2Ng4Pz+fiI4dOwbA29tb7LqqkZqaamtrC8DFxSUjI0M493zzzTeV6WlnZxcaGhobG1tSt3PP1xB5siqrh/jeaF3o5vOlpKSk4uLijh07Nm7cGLpapMDd3d3BweHJkyeZmZlvvvlmaWmp0O7o6Dhy5EipVNq3b1+Tau97qm7qVLRogfffx/ff484drU9WZfUQjxutC915dFNRlap0c5KV4OnTp9evX5dIJB06dCgtLRX2pu7YsWNWVtaqVav69++vqQwVhIRg3z5YW2PnTvTvr8XJqgBw69atESNGdO/efebMmdrsl2kOx2hd6EWM6uYkK0FiYqJCoejSpcvly5evXLkyY8YMAEFBQcoNqDXurbdw4gRatsSpUwgIQGampjvMysoSJuO2bt16165dCQkJ33777axZs4jXBtJ/HKO1lp+fn5GR0bBhQw8PD7FrqUSIUeEqPi8v7/r16w0bNhQe1uuaihHfvn37ixcvQvuJ37EjTpxAx45IS4ueMkVDc1UzMzNXrFjRs2dPFxeXzz///MSJE+bm5n5+foMGDWrQoMGSJUtGjx4tl8s10TXTHrFvzuqfo0ePAujRo4fYhVQiDB5o0KCBMHjg8OHDAPz8/MSuq3pjxowB8NNPPwmHwiqo6aLMNXryZPdHHxkZGVlbWx85ckRd75qZmRkVFeXv769cCMbc3Hzo0KHr168XHgAS0W+//Sbsh/jWW2/l5uaqq2umfRyjtbZkyRIAkydPFruQSuLj4wF4eXkJh4sWLQIQHh4ublWv4ubmBiApKYmIsrOzAVhbW6t39eiaKy4uHjduHP6abaXKW9UkPStKTk5u0aIFAA8Pj8zMTFW6ZiLiJ/W1phc3RnWzSEFOTs6NGzcsLCyUswMA+Pj4aGcFv5dJJJKNGze2a9du/vz5oaGhGRkZtZ2reufOnR07dshkspMnTxIRAHNz8/79+0ul0nfeecfS0vJVX9ipU6f4+PjBgwenpKT4+vru27evS5cuKn4cJgKxc1z/vPHGGwAuXbqkbLl+/bqI9Qjee+89AKtXrxYOXVxcAKSlpYlbVbUOHjwIwN/fXzj86quvAAgPW8QVHR0t7Kv6j3/8oyb7qr7m3LOgoKDm/ebk5PTu3RuAra1tHO8cpYc4Rmvn2rVrAMzMzJS/Zhs3bmzQoMGPP/4obmHCzJ/z588TkbBfSOPGjct0cnj5v//9bwBTp04VDgcNGgRg27Zt4lYlUM5VHTFixKumqKkrPSuSy+WjR48WfrQ2b96swidgIuAYrZ1ly5YJP+vKlsjISOF3ad68eWJVlZuba2xs3LBhQ2HOz549ewD07dtXrHpeT1hDWrliXpMmTQDcunVL3KqUTp48We1cVU2kZ0WlpaWTJ08GYGxs/P33q1R/Q6Y1HKO1c+XKFeG3aNSoUaV/zfL+6aefhMWKPvzwQ/VPXqwBYTlk5eAB4dbejBkztF9JTbRs2RLAlStXiOjmzZsAmjRpInZRlaSmpgp3Rdzc3LZu3Tp79mzNpWcVUVFRZmaWXbs+4qmqeoRjtNYiIiKEUeIV1yiKjY21sLAAEBgYWO0zWY2qMnhg6NChALZs2aLlMmri/v37AKysrIQbDjKZDEBwcLDYdVWVlZXVuXPnik8RGjVqNGbMmG3btr1mYSq1kMnuSyQE0JgxpGOryrDqcYzWxenTp4VL0e7duyuv+86cOePo6AjAx8fn/v372qxHKpUCWLt2rXDo5OQEQBcefL3s4cGDOwMCFr/7rnAYEREBYO7cueJWVa28vDxPT8+GDRu2bt1627Zt2lzN68gRsrYmgHr2pEePtNYtqyOO0Tq6du1amzZthOs+5bjx69evt2vXDsAbb7whXLRqhzB4ICUlhYju3LkDwM7OTqxhmH8jMpIAmjlTOLr68ce/9ulzcu9ecYvSQZcuUcuWBJC7O92+LXY17LU4RusuOztbWN+zadOm586dExofPXrUs2dPIciOHz+uhTIeP35sZGRkYWEh3KsV9gQNCgrSQtd1MWQIAfTrr0RECgXZ2BBA9+6JXZYuunuXunQhgJyc6MIFsathr8Zz6uuuWbNmcXFxgwcPfvDgQUBAwN69ewHY29sfOnRo6NChOTk5AwYM2LZtm6bLEBa39/b2FlZF0uWB9wCQmAgAwvJ9GRnIzUXz5nByErco3eTsjLg4BAQgOxu9e+PgQY33WFhYGB8fv2zZsh49egQFBQk/S+zviZ3jeu/58+cTJ04EYGJiohz9Xlpa+sknnwiN//nPfzRawNdffw1g2rRpwmFQUBCAHTt2aLTTOsrMJIDs7Ei44RATQwCNGCF2WTpNLqexY8t3P9m4Uf3vf/fu3a1bt4aHh/v7+5uZmVUMB0dHR/X3Vx9xjKqBQqFQjh6NiIhQti9evFgYJRMeHq65O5V37tzZtGmTcFdBoVDY29sDuHPnjoa6U8n27QTQwIHlh9OmEUBffy1qTXpAoaCICLXtfpKfn3/kyJGFCxcOHTpUeFKqZGpq6uXl9dlnn33zzTfCxc2ePXvU8AHqO45RtVGOHp0wYYJy9OjatWuF0VHjx4/XwpBSYZJV06ZNNd1RHf3rXwTQ7Nnlh716EUAHDohak9747jsyNiYnJzp6lCIiKCvrxV8tXUopKa/8QoWCLl+mtWspLIw6d6ZOnXpWjM5mzZqNGDFi8eLFcXFxT58+VX7V8uXLAbi5uenaXl46iGNUnXbt2iWMHg0KClKOHj106JCwHlr//v3z8vI0WsCsWbOgq/svEREFBhJAO3cSEZWWUqNGBFDlXe3Ya/z6K50/T+vWEUAhIS/a27Qp/6Yq5edTfDwtXkxDh5KDAwEv/vTrF9GjR4/w8PBNmzbdvHnzVX09f/5c2P528eLFmvo89QXHqJopR49269btwYMHQmNCQkLTpk0BdOrUSUOX2ykpKZMmTRIuxAICAjTRhaoUCrK3J6D8POrSJQLojTfELkv/rFtHXbqQszMpL7iFGE1NpTVr6KOPyN29fNc+5Z8WLWjUKPruOzpxgoqKatrRb7/9BsDS0jKr4qkvewnHqPpdv369bdu2AFq3bn316lWh8caNG8LqIa6urpcvX1ZXX4mJibNmzRKW7xRYWVnp5sB7unaNAGrWrPxw7VoCaPRoUWvSS+vWUc+etG4dubiQcBUuxGjfvi9ys0ED8vam8HBav55U+XEQFkB477331FV8vcQxqhGPHj3y8/MDYG9vf+LECaHx8ePHvXr1AmBraytsJV9nwo7EFfdzt7e3Dw0NXblype7eydq8mQAaNqz8cPJkAmjJElFr0ktCjCoU5OdHwhNNIUa//ZbGjaOoKDp9moqL1dPX7du3LSwsjIyMjh07pp53rI84RjXl6dOnQ4YMAdCoUaPdu3cLjUVFRaNGjQJgZmb2qzAEvTZelZ6xsbE1WR9TZNOnE0Dz55cf9uhBAB09KmpNekmIUSK6cIHMzeny5WrujarR3LlzAXh5eSnX4mFVcIxqUGlp6aRJk4TRo8oFSSs2bt26tSbvo9/pqRQQQAAJ8z5LSsjcnIyM6MkTscvSP8oYJaLwcBoyRLMxWlhY6OrqCmDVKl6+r3ocoxq3ePFi5ZBS5ejRqKiotm3bKp9BVauepKdSWBi1a0fCoi2JiQRQ+/Zi16SXKsZoXh45OZFEosEYJaKtW7cCsLOze8QLpVSHY1QblKNHP/jgA+Xo0Vett/Zyejo4OOhxelbr4kUKCaEvvhC7Dr1UMUaJaOPGF6PINEeYHTdlyhTNdqOfjIio6vxQpgGHDx8OCQkpKCgYMGDA9u3bhZGkFaWmpspksi1btly9elVocXBwGDx4sFQqHTx4sDCwX489e4bVq3HsGIqL0aEDPvsM7dqJXZO+ys5GVlb5sgSC33+Hhwcqz0hSs7S0NE9PT4VCkZiYyPvuVSV2jhuQs2fPCkNKO3furByIZxDnnoWF5O1NPj60fj3t3EkTJ1KjRqSV5a/qsUWLKDiYDh/WXo/h4eEAevXqpaNrMIqHY1SrlKNHW7ZsGRYWVnG8p5OT0+TJk+Pi4nRzHzqVLF1KLi6Vhn1PmUJdu4pXUH0wYgQBtH279nrMy8tr1qwZdHVjBRHxRb225eTkBAcHJyUlyeVy1LMr91cZPhweHli06EVLUhK8vJCfj1fv4c5ez9cXZ87g5En4+Wmv0zVr1oSFhbVo0eLKlSuNGjXSXse6jdcb1TY7O7uZM2fK5XJXV9djx449ePBgw4YNw4YNq7cZCuDmTbRoUanF1RVEuHlTpILqg+xsANpeqfXjjz/u3r17VlaWcvwJA8eoKFJSUgCMGjWqT58+xsYG8L/AxgYFBZVa8vIAwNZWlHLqASI8eAAATZtqtV9jY+OoqCgjI6Nly5ZlZGRotW8dZgC/w7pH1xeoV7v27ZGQUKnlzBk0bgxnZ5EK0ns5OSguhq0tzM213bWfn19oaGhxcfHMmTO13beu4hgVQWJiIoBuFUes1G8TJyI2FrGx5Yd37iAyEp98AkM4E9cMUa7olZYuXWptbb1r1679+/eLU4GO4Z9jbcvKysrOzrazsxO28zQIPXrgv//Fhx+iUyf4+8PdHb6++PprscvSY+LGaNOmTWfPng1g6tSpxcXF4hShSzhGtS0hIQGAj4+PsL+IoRg/HnfvYtUqfP010tPx88+ovO0PqxVxYxTA1KlT27dvn5GRsXLlStGK0Bkco9pmcDdGlczN4e+Pfv14H1DViR6jEolECNAFCxbcu3dPtDp0A8eothlujDL1ET1GAQQGBg4fPrygoODLL78Usw4dwDGqVURkcM+XmAYIMdqsmchlrFixomHDhhs2bDh+/LjIpYiKY1Srbty48fjx46ZNm7aoMhydsdr480+CDsRo69atp0+fTkRTp05VKBQiVyMejlGtEq7o+VSUqSgrq72dXTtn51tiF4Ivv/zSxcXl/PnzEydOFLsW0XCMahXfGGVqkZ2dnZOT4eRkJ3YhsLCwGDZsGIAtW7aIXYto6u88bp005/LlYE/PltpcTILVOwUFBU+fPrWwsHh51VrtKysri4+PB2BpwKvMcIxqkUJhHR//Vn4+OncWuxSmx7KzswE46ca4sWnTpiUnJ1tYWKxbt07sWkTDMapFV68iPx8uLuI/GmD6THdidNGiRStXrjQ3Nz906JC/v7/Y5YiG741q0blzAMA3RplqdCRGN23aNGfOHGNj45iYGEPOUPDZqFZxjDJ10IUY/f333ydMmEBEUVFR77zzjoiV6AI+G9UijlGmDqLH6KVLl0aOHFlSUjJr1ixhgyYDxzGqLWVlSEqCkRG6dhW7FKbfxI3RrKys4ODgvLy8sWPHLqq4MYwB4xjVlpQUPHsGNzfY24tdCtNvIsZoTk5OYGBgVlZW3759161bZ1irlL0ax6i28BU9UxOxYlQul7/99ttXrlzx8PDYuXOnGS91+BeOUW3hGGVqIkqMKhSK999///jx4y1atNi3b5+NjY02e9dxHKPawjHK1KGkpKSoqAjAwIEDk5OTtdbvF198sX37dmtr63379rVs2VJr/eoFjlGtKCnBpUswNoaXl9ilMP0mkUhCQkIAnD9/vkuXLgMGDNi9e7emV1dasmRJdHS0RCLZsWNHp06dNNqXPjIiIrFrMAB//okpU5CXhwMHxC6F1QdHjx49cODAmjVrcnNzAbRu3TosLGzSpEmauNbesmXLe++9B+DXX38dNWqU2t+/HuAY1bzMTNy6BXt7vPkm74XJ1KigoGDz5s3Lly+/evUqgMaNG48bN27atGkdOnRQVxdxcXGDBg0qLi5esWLF559/rq63rW+Iac7DhxQYSFZW1L07NW9Orq4UHy92Tay+KSsri42NHTBggDD8yNjYeMCAAbGxsQqFQsV3vnTpknB6O2PGDLWUWl9xjGrSgAEUGEi5uURECgXNn082NnT/vthlsfrpwoULYWFh5ubmwhmSp6fn6tWrCwsL6/ZuWVlZwqOkMWPGlJWVqbfUeoYv6jXm+nW0aYP0dLRtW96iUMDdHZ9+iqlTRa2M1WcPHz5cu3btDz/8kJWVBcDR0XHChAlTpkyp1b41eXl5ffr0SU5ODggIOHjwIA8RfT2+VacxV67A1vZFhgIwNka3brh6VbyaWP3n6OgYERFx/fr1rVu3+vr6Pnz4cMmSJW5ubqNHjz59+nRN3qGkpCQkJCQ5Obljx448zL4mOEY1Q6FAQQEaNara3rgxcnPFKIgZFolEIpVKT506de7cudDQUIVCIZPJ/Pz8fHx8NmzYUFpa+qovJKKPP/74yJEjzZs337dvn62trTbL1lMco2p16xaio9GrF1asgKsr7t9HSUnVF7RuLVJxzBB5e3tv2LAhPT09IiLCzs4uMTHxgw8+aNWq1bx583Jycl5+/fTp02NiYqysrPbu3evi4qL9gvWS2Ddn64WMDFq0iLy8CCj/89Zb9OwZ2djQTz+9eNnt2ySR0KFD4hXKDFpBQcHq1avd3d2F331LS8uwsLDU1FTlC7799lsAEonk8OHDItapd/gRkwpu3cKuXZDJcPIkhG+jhQX69YNUilGjYGGB9evx6aeYPRt+fsjMxIIF6NEDmzeLXTczaAqF4ujRo9HR0Xv37iUiY2Pjfv36jRs37tq1a0uWLCGi9evXh4aGil2mPuEYrb2/Tc+Kjh3DmjXlw++HD8eHH8LERJSqGasiJSUlOjp648aNwiR9wcKFC2fPni1iVfqIY7Smbt26tWvXLplMdjA3t1FqKgBYW2P4cEilCAoCP81k+ikvL2/x4sXLli0rKyvr1q3b2bNnxa5I/3CM/o2MjAyZTCaTyS5evCi07Bw4cETTppBKERjI6cnqh8LCwqKiInteU7xOOEarpzz3PHnypPAtsrGxGTZsmFQqDQoK4pF0jDEl3hm0kvT09P3793N6MsZqjmP0hcmTJ69atUpYutHGxmb48OFSqTQwMJDTkzH2GnxRX04ulwtrOowePTo0NJTTkzFWQxyj5c6cOePr62tlZZWXlyd2LYwxfcKTQculpKQACA4OFrsQxpie4Rgtd+7cOQA+vOUcY6yWOEbLcYwyxuqG740CQElJiZWV1fPnz588eWJlZSV2OYwxfcJnowCQlJRUXFzcoUMHzlDGWG1xjAJ8Rc8YUwHHKMAxyhhTAcco8FeMduvWTexCGGP6hx8xobCw0NraGkB+fr5yc1rGGKshPhvFhQsXSktLPTw8OEMZY3XAMco3RhljKuEY5RhljKmEYxQJCQng50uMsboy9EdM+fn5tra2DRo0yM/Pl0gkYpfDGNM/hn42mpiYqFAounTpwhnKGKsbQ49RvqJnjKnI0GM0MTERgLe3t9iFMMb0laHHKJ+NMsZUZNCPmHJychwcHMzNzfPy8kxNeXc/xlhdGPTZaEJCAhF17dqVM5QxVmeGHqPgK3rGmGoMOkZ5/hJjTHUcoxyjjDGVGO4jpvv37zs5OVlbW+fk5BgbG/Q/J4wxVRhufAg3Rn18fDhDGWOqMNwE4St6xphaGG6MKs9GxS6EMabfDDdGhWmgHKOMMRUZ6LDz0tLSuXPnpqWlubq6il0LY0y/Ge6TesYYUwvDvahnjDG14BhljDGVcIwyxphKOEYZY0wlHKOMMaYSjlHGGFPJ/wN8fkq8z+n7NgAAAY16VFh0cmRraXRQS0wgcmRraXQgMjAyMy4wOS42AAB4nHu/b+09BiDgZ0AAESAWBeIGRjaGBCDNyAyhmZg4GDSANDMTmwOYZmFzyADRzIzYGBAl7AxgASagWRABmBlws6Bmw2h2BgWQOLowBg2ziJuBkYGRiYGJWYGZJYOJhTWBlS2DiY09gZ1DgYNTgZNLg4mTW4Gbh4GHl4GXj4GPn4FfgEFAkEFQiIFdOINJmDlBiI9BhAloFhuzMDsbKwsrP5+QoID4L5DH4SGioHj4wKmrRQdAnCf1Ow8UnRQBs19+7T4Q9+jNfhB7XUjTgd1qh/eB2Dm2yw58tZG1B7EN58w5MDWa1QEsrhJ34MZmZTD7fZDYgfb/x8Fqnv3O2c8WwQQWd9HwtHvs3goWT/t3da+B822wmZ99zttn/TgIFv9eru/QoMAKZn9zbXXobawDs7fqrXSI6pm7C8S+zHfDYfmyJXYg9ovYDw4spyrA7rzXfMHhPzMb2P3+rUscOO33g8XTpmoeKMndZwtiiwEA83tlUb/XX1UAAAH8elRYdE1PTCByZGtpdCAyMDIzLjA5LjYAAHicfVRbbhsxDPz3KXiBFcSnxM/YDoqgyBpo3d6h/7k/SspwVgGEaC1C0s6ORM7IJ8j26/rz3wd8NrqeTgD1m5+7w1+utZ7eIQdwfv3xtsPl/nJ+rlxuf/b7b6AKhPFNPF+xL/fb+3MF4QKbleqtOcPGpblQbFFLHe34lhKp8d66EWxUmKS5LpAMN9ikcONmDhuWrtW0L5CSnFJqo84Ntlq4I+qKUx+7o4t7MhkKIS6A9qDsLtUMqNRgxhVjSyAXaZE7B1C1daUFsCcw0pXekQCLGkm3BdBhzxyctKHn1mxGvABiaBTL6CbCwVgFSVeMkeEtKbGKdM+RUI+yr6AUUIy6uLLlKVHZl5tzbE6lCZonkVKttGRMdaSghcyxXNzjE1kBNRLXQt08CrglAKmuSompjpWm2DEpmVD7kjLVaZEEivEoasPOy3T6oFS00DF1qs5x0hXSAxkWimKH4GFLiYSWHqL6kNzEmwwqJ++rhF7365fr9Lhg59t+PS5YPnTcopgAH1cFo8txH/LRw/QxATusLdHbYWCJ3g+bYnQ/zIjZZ89RBsTJXDhWaPIQjsCTWXAEmVyBI+gkP45gk8w4Qpv0xBH6pBuO4JM+EhnQLIOM8LkwTuzT3ln/udo5f/4Vxvj0H3QGAF63ugZPAAABBnpUWHRTTUlMRVMgcmRraXQgMjAyMy4wOS42AAB4nB1QSY4DQQj7yhwTqRphdtTKqe/JI/KNPH6o5oQs44Xr+nzxnXm8r8fr8/xc11uuGXl+8fd7HEHcmb0OpWzTdR4+S1SsQ0jFahAjTc1cB6icI26IU8rWwaQFuN+HaF9MARPgJlUb5xLi0tyIkuX4DeKetY/GxKqwQB5iPQhTiyd6n2mErJNHOGzCgdggcZPAZtU7gEmJ5Toxzu22peA6UkJpyEnkwizDMELYlB2LtlnX6SQVk3pkmCE8bkHpmETTTODT8cwRhMUmdaJUN8kR2D/i1u4thIl2/8hGG3e1sE4bIW7pElnP3z9luVGQoUe8CgAAAABJRU5ErkJggg=="
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "\n",
    "\n",
    "smiles = df.sample(1)['Drug'].iloc[0]\n",
    "smiles\n",
    "while len(smiles)> 40:\n",
    "    smiles = df.sample(1)['Drug'].iloc[0]\n",
    "    print(smiles)\n",
    "mol = dm.to_mol(smiles)\n",
    "mol"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:30:39.634480730Z",
     "start_time": "2024-09-19T13:30:39.610932407Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "outputs": [],
   "source": [
    "confs = dm.conformers.generate(mol)"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:33:52.448276524Z",
     "start_time": "2024-09-19T13:33:51.186564134Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "outputs": [
    {
     "data": {
      "text/plain": "",
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "c258ba1bb7eb4c1b9f34185518c0602b"
      }
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": "NGLWidget()",
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "71724881203a404595411d7bd87731a2"
      }
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "dm.viz.conformers(confs)"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2024-09-19T13:34:42.472268450Z",
     "start_time": "2024-09-19T13:34:42.424962776Z"
    }
   }
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "outputs": [],
   "source": [],
   "metadata": {
    "collapsed": false
   }
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "2.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 0
}
