{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "from rdkit import Chem"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "from smiles_canonicalization import canonicalize_molecule_smiles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAIAAADCEh9HAAAABmJLR0QA/wD/AP+gvaeTAAAckElEQVR4nO3deVhTV/4/8HcIuyhBXECqIuhY0apTEJcIVkVZGlSYxqVKnW6OrY84td+WmXamjL/n6TP2W+2ELm7tt5Z2HreAYMANpUWCWwWrBdwri4IsQtghSHJ+f1waIyoiAS7hfl5/1XOXfFLbd84995x7RYwxEEII6SwLvgsghBDzRjFKCCEmoRglhBCTUIwSQohJKEYJIcQkFKOE9GotLcjKwo0bDzTW1yMrC3V1PNVEHkQxSkivc+sW1OrWf66qgo8PJk1CXt79HbKz4eODCxd4qY60RTFKeHP58mW9Xs93Fb1IXh5iYjBzJkaOxMsvw3hK9717WLeOv8pIuyhGSY/S6/UZGRkrV660srLy8vKSSCS//PIL30Xx7Px5/POfmDABHh74619x8iTs7TFtGmpq7u+zahWSkpCQwF+V5PEs+S6ACEJzc3NqampCQsKBAwfKysoM7bW1tbNmzcrMzPzDH/7AY3k9T6/HL78gKQm7d+PatdZGJycEBEAmQ3g4HBwe2F8qRXk51q3DvHltNxHeUYySbtTY2Hj8+HGlUqlSqaqrq7lGd3f3BQsWTJkyxdfXd/bs2cXFxdOnT09OTp4+fTq/1fYAnQ6nT0OpRFwciotbGwcNQnAw5HIEBsLa+rHHfvopvLwQHY3Nm3umWNJRFKOk62k0muPHjyclJSUkJNT9fjvZy8srNDRUJpPNnDnTsOf169cXL1588ODBefPmxcXFBQUF8VRy92poaEhJUcfHByYno6qqtdHTE2FhCAvDtGmw6MDo2ogR+Mc/8M9/4pVXurVY8vQYIV2krKwsNjZWJpNZ/96nsrCw8Pb2jo6OvnLlyuOOamlpef311wFYW1vv3r27JwvubpWVlfv27YuIiHBwcADg6dkEMC8vFhXF1Gqm1z/2wNpatm8fW7qUxcSw8nIGsF27GGNMq2XjxjGplJ06xQCmVvfYVyHtoRglpsrLy1MoFFKp1OL3PpVYLJZKpQqF4vbt2x05g16vj4qKAiASiTZv3tzdBXe34uLirVu3zps3z8rKyvBzMm3atK1bc65fb+/AigoWG8vkctavHwMYwKZMeSBGGWOpqQxg771HMdqLUIySTsrJydm4caNUKhWJRFxY2NraymSy7du3l5aWPvHw0tLSNrspFAouiKOiovTtdNV6q/z8fIVCERAQYGlp+VQ/J2VlLDaWyWTMyqo1PS0smLc3i45mV6+2jVHG2MsvM1tbitFehGKUPJ2cnJzo6OixY8caxoX69esnk8liY2Nramo6eJKamhpvb28PD4/rD3bPfvjhB64H9+c///nevXvdUH7Xa+fnpKSkpJ0Db95kCgWTSplI1JqeYjGTSplCwYqK7u/2cIzeucMkEorRXoRilDxZS0uLWq2OjIx0c3MzpKezs3NERIRKpdJqtU97wrKyMh8fHwCurq4XL1403nTs2DFuJHHhwoUNDQ1d9yW63ubNm0ePHm34F+Lo6Lhs2TKlUllXV9fOUTk5LDqaeXu3RifA7OyYTMZiY5lG84j9NRrm7c2OHHmgcccO5u3NfvmlS78P6SyKUfJYjY2NKpVq1apVQ4YMMYTFiBEjIiMjjx07ZmJvsa6ujrsvL5FITpw4Ybzp7NmzgwYNAjBr1qyqqirTvkQ3Wr9+vfHPSVNT0+P21Ol0GRkZ7777bmDg/zOkp5MTi4hg+/ez+vr2PiUzk1VWdn3xpAtRjJK26uvrVSpVRERE//79Denp4eERGRmpVqu7cNRSq9UuXboUgI2NjVKpNN506dKl4cOHA5gwYUIH71P1vGvXrp04caKlpeVxOxh68cOGDfv9XpPV+PH3Vq9mKSmsufmxZ9bpmFrNoqLYmDEMYF9/3S31k65CMUru+/LLLwcPHiwWi7n/50Ui0ZQpU/7973+3M13JRHq9nuvTicXibdu2GW8qKip67rnnALi7u1+9erWbCugOj+zFjxw58om9eK2WHTrE3nyTDRly/5LfzY1t3dqT5ZOnRjFKWp08edIwY0kqlW7cuPF6+9Nzus7GjRu5z42KijJur6ysnDFjBoChQ4dmZWX1TDGdptFouFmixr14Ly+vqKio9nvxDQ1MpWIREczR8X56uruzyEimVjOdrie/BOkMilHSavXq1QAGDBjAS9dv586d3DyhNWvW6IySo66uLiQkBICDg8PRo0d7vrAnun37dptFB1x6RkdHX7p0qZ0DKyvZvn0sIoI5ONxPT8PkfGJGKEZJq4iICAArV67kq4DExEQ7OzsA4eHhjY2NhvZ79+699tpr3DKnPXv28FVeG3l5eX/6058cHR0NXXhLS8s5c+Z88cUX7Q/mFhUVfffd7YAAZml5f5bojBns00/Zb7/1WPmkK1GMklbe3t4A0tLSeKwhLS3N0dERwJw5c6qrqw3ter3+vffe44ZrP/vsMx4r/O2337glW4ZZohYWFrNnz/7222/v3r3bzoHGa72mTdtkPEu0t95CIx1FMUoYY6yhocHa2losFtfW1nItWq22/fmP3SQ7O5ubnerj4/PwMicuvNoMofYAbtHBuHHjDJft9vb2M2bMWLNmTXFxcTsHXrx4MTo6euLEiYYD7ezslix5LTaWpjH1HRSjhDHG1Go1gMmTJxtaDh48aGlp+cYbb/R8MXl5edzjRz08PG7cuGG8KTY2llvm9Oqrr3b3MifDdKVnnnnGEIIDBw6MiIjYt2/fk+bYd8FaL2Iu6EF5BADOnDkDYNq0acYtLS0tzs7OPV+Mu7t7enp6SEjI+fPn/fz8Dh06NHnyZG7TK6+8MnDgwCVLluzcuVOj0ezevdvW1rZrP12r1arV6qSkpH379pWUlHCNw4cPDw4OlslkQUFBhgeOtKHT6U6fPq1UKuPj44uKirhGZ2fnkJAQuVweGBho3c7DRIlZ4zvHSa/w0ksvAdi5c6ehZd68eQD279/PV0m1tbXz588HIJFI0tPTjTedOXOGy/cXXnihq5Y5GRYdDBgwwPB/RwcXHRQUFHD5bjjQ3d39nXfeSU9P19F8JQGgGCWMMcZdt16+fJn7o16vl0gkAIqMH5LR47Ra7ZIlSwDY2NjExcUZb8rNzTUsczKlyIqKitjYWLlc3q9fP0MIctOVMjMzO3gSjUbD9TS7Y60X6f0oRgnjrkAlEomh65STkwNg5MiRvNbFGGMtLS1vvfUWALFYvGPHDuNN+fn53ODjqFGjrl279lSnLSws3L59u0wmM34kKLfo4GlPxdm1a5d5LbUiXYhilLC4uDgAgYGBhpZvvvkGwJIlS3isyhi3zEkkEkVHRxu3V1RUcG9wGjp06Pnz5594nps3b7aZrmR4JGj7N9wJaQfFKGHclEzjhHrzzTcB8DtDs41vv/2WW+a0du3aNsucgoODATg4OKSkpDzyWO6+OTcxlmNnZ8fdN9c88uF0hDwNilHC/Pz8ABw6dMjQws1zPHnyJI9VPSwhIYG7L//yyy83Gz0fSavVLlu2jBtC3bt3L9eo0+kyMzOjo6ONX93s5OQkl8tjY2MN02MJMZ2IMWbarX5i3u7duyeRSBobG8vLy7nb37W1tU5OThYWFtXV1dzqzN4jLS1t0aJF1dXVc+fOTUhIMDwEhDH2/vvvb9q0SSwWr1mzpqmp6cCBA6WlpdxWV1fXRYsWhYeHz5o163HTlQjpPL5znPAsMzMTwNixYw0tqampAHx9fXmsqh3Z2dnc4zunTJlSVlZmvOnjjz8WiUTcI58BuLu7c/fNadYR6VYdeD026dMeOfG+TUuvMmHChIyMjDFjxpw7d87f37+wsNCw6YMPPnB3d7979+5rr7124cKFvLy8mJiYmTNnWnTkNfCEdBb95yV0Z8+eBTB16tR2WnqbUaNGpaenT548+caNG9nZ2Yb22trawsJCKyurL7/8ctKkSTxWSASFFoMK3eNitNf2RjkuLi5paWlqtfrFF180NJ47d06n03l7e/e2IV3St1FvVNAqKyuvX79ub29veARRXl5eaWnp4MGDPTw8+K3tiRwdHWUymXFLLx+OIH0VxaignTlzhjHm4+PDTcmEmSdR7x+OIH0SxaigPXz9btZJZBbDEaTvoRgVNK7vaRya5tsbNaPhCNLHUIwKF2Ps3LlzMIpRrVZ74cIFCwuLKVOm8FpaZ5jvDwAxdxSjwnXlyhWNRjN8+HDupR0Azp8/r9Vqx48fb/zMTXNh1sMRxKxRjAqX2U28b59ZF0/MGsWocJnjxPvHMevhCGLuKEaFqy/1Rs16OIKYO4pRgaqvr8/NzbWysnr++ee5lrKysoKCgv79+z/77LP81tYJ5vsDQPoAilGBOnfuXEtLy6RJkwzrJk+dOgVg6tSpYrGY19I6w3yHI0gfQDEqUA9338x67jrFKOERxahAPZw7D0/FNxdlZWX5+fn9+/cfN24c37UQIaIYFaiff/4ZRn1P7pUbAHx9ffksq1PMejiC9AEUo0KUn59fXFzs7Ozs6enJtWRnZ9fV1Y0ePXrIkCH81tYJZj0cQfoAilEh4q7fp0+fbnjPsFmPLZrvcATpGyhGhagvTbw36+EI0jdQjApRX5p4n5OTU1dX5+npaY7DEaRvoJeICE5zc/OFCxdEIpGPj4+hcffu3adPnzbH9xeZ7w8A6TMoRoWlpqYmJiamqalp9OjREonE0D5p0iRzzFCY83AE6TPool4QKioqvv/++9DQ0CFDhnz00Udubm4FBQVKpZLvuroA9UYJ70SMMb5rIN2loKAgMTExISEhIyNDp9MBEIvFfn5+IpHop59+EovFW7ZsWbVqFd9ldl5VVZWzs7O1tXV1dbW1tTXf5RCBoov6PujmzZtJSUlKpfLUqVPcz6SNjc3s2bNlMtmSJUtcXFwAfPLJJ3//+9//8pe/3Lx5c+PGjXyX3Elnz57V6/Xe3t6UoYRHFKN9R25urlKpVCqVly5d4lrs7Ozmzp0rl8sXLlzo6OhovHNUVJSLi8sbb7zxySef1NXVff755xYW5jfCQ1f0pDegGDVver3+1KlTycnJ+/fvv379Otc4cODAF198MTQ0NCQkpF+/fo87duXKlU5OTkuXLv3qq6+Ki4t37dpla2vbU4V3Dbq/RHoDGhs1Szqd7vTp01zf886dO1zj4MGDg4KC5HJ5UFCQlZVVB0+Vnp6+YMGC6urq2bNnJyYmmtFjjxljgwcPrqioKCwsHD58ON/lEOGiGDUnjY2Nx48fVyqVKpWqurqaaxw1alRoaKhcLpdKpYbFnU8lNzc3MDCwqKjI29v70KFD5jKP/dq1a2PHjnV1dS0uLua7FiJodFFvBjQaTVJSUnJy8uHDh+vq6rhGLy+v0NBQmUw2c+ZME88/fvz4jIyMwMDArKys6dOnHz16dPTo0SZX3e0MTwbguxAidBSjvVd5efnhw4eVSmVKSkpzczMACwsLb29vmUy2bNmysWPHduFnubu7nzp1SiaTnTlzxs/P7/Dhw5MnT+7C83cHGhglvQUjvUxeXp5CoZBKpYZb52KxWCqVKhSKoqKibv3o2trawMBAABKJ5MSJE936WR1XXFy8devWhQsXNjc3G7dzb5HqPXUSwaKx0d4iNzc3OTk5KSnp5MmTXIutrW1AQEBoaOiiRYt6bLyyubl55cqVe/bssbGx+e9///vSSy/1zOc+jFs7kJycnJaW1tLSAuDIkSNcygNobGx0dHRkjFVVVbUzG4GQnsB3jhPGGPvmm28MfyMSiWT58uXx8fH19fW8FKPX69evXw9ALBZv3769hz/9119/3bBhg/ECfzs7u4ULF3733Xcajcaw24kTJwA8//zzPVweIQ+jsdFeISgoyDBdKTAwkN81OSKRaPPmzUOGDPnb3/62evXq4uLif/3rX939odzagb179165coVrsbe3nzNnjlwuDwsL69+/f5v9aWCU9B4Uo72Cm5tbaWlp56YrdZOoqKihQ4e++eabGzZsqKioiImJ6fJlTobZr/Hx8UVFRVyjs7NzSEiIXC6fP3++jY3NIw/U6/UpKSmgGCW9A42NkvYcOHBg2bJljY2N4eHhu3btelyuPZWmpqaMjIykpKS9e/eWlpZyjSNGjAgKCpLJZMHBwZaWj/51N8RuXFxcSUkJN/rx+eefm14SISbhe1SB9HZpaWncevw5c+bU1NR0+jz19fUqlSoiIsJ4oZSHh0dkZKRardbr9e0cGB8fv2LFCuMHpLq4uHC943fffbedYwnpARSj5Mmys7Pd3NwA+Pj4lJWVPdWxd+/ejY2Nlclkxj1ZLy+v6Ojo3Nzcdg7UaDT79u2LiIhwcHAwPjAqKoqL3f3793MPAVixYkWbuVCE9CSKUdIhN2/eHDNmDABPT88bN248cf/CwsLt27fLZDLD6n4LCwupVLpx48br16+3c2B5eTkXu8b32bjYvXz5cpudf/zxR65vGxAQYEpPmRBTUIySjiopKeFmvLu6ul64cOGR+9y4cePjjz/28fEx3C6zsbEJCQn5+uuv2+/G5ufnKxSKgIAAw8CoYdHB7du32zkwMzOTm1Q7ZcqU8vJyk74hIZ1CMUqeQm1t7fz58wFIJJL09PSHd1AoFFwI2tnZyWSy2NjYqqqqdk6Yk5OzceNG44eqcIsOFApFSUlJB6v67bffuIcAjBs3rqCgoDNfjBATUIySp6PVahcvXsx1M+Pi4tpsLSgoePXVV1UqVWNjYzsnycnJiY6OHjdunOGy3d7enovd6urqTlR1584d7iEAw4YNu3jxYifOQEinUYySp9bS0rJ69WruunvHjh0dP0qtVkdGRj7zzDOG9HR2do6IiFCpVE1NTSZWpdFo/P39ATg5OWVkZJh4NkI6jmKUdBL3BieRSBQdHd3Obo2NjceOHYuMjBw6dKghPYcPH75q1SqVStW1d9ibmpq4hwDY29sfPHiwC89MSDto+j3pvC1btqxdu1av169du1ahUBgvc2poaEhNTVUqlQcOHKipqeEaPTw8ZDKZKU+YfiKdTvf222/v2LHD0tJy27Ztr7/+end8ShdITUVKCior4eCAmTOxcCEes+iAmAG+c5yYt4SEBG7ypq+vb319/a1bt2JjY+VyufFTl7jpSpmZmT1Tkl6v//DDDwFYWtps23anZz70KdTVseBgJhIxPz/2+uts/nxmbc0mTWLtTkggvRnFKDFVamoqN8dTLBYbolMsFvv7+//nP//Jz8/npaqYmBh//1yAvf8+612rnFatYra27Pjx+y3Z2WzIEObnx19NxCQUo6QL7Nmzx5ChEydOVCgUxcXFfBfF4uOZrS0DWEQE6y2rnEpLmZUVe//9tu3/938MYHRnzDyZ36vJSS+0ZMmSW7dufffdd4WFhRcvXly3bp2rqyvfRSE8HAcPYsAA/PADwsPR0MBHEVotDh3CG28gOxsAMjJw7x7mzm27G/c46p9+6unySFegUW3SNVxdXVeuXMl3FW3NmYPUVISEIDkZc+YgORmDBvXIBzc24vhxKJVQqcC9w3XYMDz3HLi3YY8Y0XZ/V1dYW4NecWqeKEZJH+fjg9OnERiIs2cxaxaOHEE3vtO+ogIqFRIScOwYmppaG//4R4SFYfFiAOAmM+h0bQ9kDHo93aw3U/TXRvo+T0+o1QgOxsWL8PPDkSN49tmuPH9RERITkZjAjmZPsCgrAQALC8ycibAwhIVh1Kj7u3JLDwoLMX5821O0tHRnwJNuRDFKBMHVFWlpWLAAajWkUiQlYcYMU8+ZlweVCkolTp0CYwBE115Y9Owf8xAWhoUL4eLyiGOkUtja4vBhBAc/0J6cDOARY6bEHND0eyIgWi2WL0d8PPr1g1LZNso6KDcXSiWSk5GV1dpiZ4e5cyGXY8ECGD1a+iH5+XB3xzvvYMsWxMUhNLS1PSsLgYHw9cWhQ50piPCNYpQIi06Ht97C11/D0hI7duDVV5/u8MpKuLjg3j0AcHKCTIawMAQGwt7+8ccYcvf8eRQUYPBgREQgLg5Tp8LTE3fuQK2Gry8SEzF4sClfjfCFYpQIDmPYsAEbNkAkwv/+L/7nf57u8BUr4OCA8HDMno3fn0n9EJ0OJ08iIQEJCSgoaG0cOBB79yIgAABOnsSxY7hzB05O8PdHUBC6+o2BpMdQjBKB+uIL/PWv2LABo0dj0yYsX4533rm/9dNPkZ6OpKTWP96+jQ8+wPffP+Gczc24ri4Zv/cjHDiAsrLW1mHDsGgRwsMxaxbdi++T6C+VCNTatZg6Fb6+iIlBVhZychASgrFjW7feutU6X55z717rjM9HMp4katviUKL/Lxob4e6OBQsgl2PGDOpp9m0Uo0S4fH1b/8HCApMnY+1apKS03ae+HgsXoqkJly8jIABTp+Ljj1s3VVYiORn79yMlBY2NrY3ukxxKXvnGJWACJk7skS9B+EcxSggAbNoEf3/s3o1lyx5o79cPx48jLw+rVuHYsdbGCxfw3ns4caL1XpOFBWbMaJ0k6ukJ4OUeLp7wi2KUEACYORNLl2L9egQHP2LSkoUFjJ78B0dHHD8OsRhSKeRyvPQS3Nx6sljSu9CQDSGtPvsMjY348MNHbBo5EomJ9/84ahT270d5OTIysG4dZajQUYwS0srFBR99hG3bkJn55J3DwuDk1P01EXNAMUrIfZGRmDAB774LmgdIOo7GRgm5z9ISW7bAzw+3b/NdCjEf1Bsl5AFSKVauxM2bfNdBzAfFKCFtbdrUU093Jn0CLQYlQlddjYoKeHg80FhaCq32EU+pJ+RhFKOEAMDbb8PJCevXw9mZ71KIuaEYJQRNTXB0hE6Hqio4OPBdDTE3NDZKCLKy0NyMCRMoQ0lnUIwSgjNnAGDaNL7rIOaJYpQQnD0LAFOn8l0HMU8Uo4RQb5SYhG4xEaErLoabGyQSVFTQ45VJZ9B/NUTouK6ory9lKOkk+g+HCB03MEpX9KTTKEaJ0HG9Ubq/RDqNxkaJoLW0QCJBQwPKymgdPekk6o0SQfv1V9TXY8wYylDSefS8USJobr8ePv5CVsEfFwET+K6FmCuKUSJoQ3/aMzTte8gHUoySTqOLeiJsNPOemIxuMREBq6rCwIGwtUV1Nays+K6GmCvqjRIBO30ajMHHhzKUmIJilAgYzbwnXYFilAgYzbwnXYHGRolQMQZnZ2g0uH0bbm58V0PMGPVGiVBdvQqNBsOGUYYSE1GMEqHiruhnzOC7DmL2KEaJUNEj70kXoRglQkUT70kXocWgRKjmz0f//nj+eb7rIGaP7tQTQaqqgkTCdxGkj6CLeiIkJ05g7lxYW8PJCba2CArCzz/zXRMxexSjRDAOHEBAAMRiJCYiMxP79qG2Fv7+OHasdYfUVBw5giNHcOoUr4USM0MX9UQYmpowciQmTcLhwxCLWxubm+Hnh9JS3LgBS0ts2ICGBgAYNgzr1vFYLDEvFKNEGA4cwKJFOHoU8+c/0K5UYvFi/PgjZs/mqTJi9uiingjDr78CwLhxbdsnTLi/lZBOoRglwlBbCwBDhrRtHzoUAGpqeroe0odQjBJh6N8fAMrL27aXlQHAgAE9XQ/pQyhGiTBwF+9Xr7Ztv3wZACZO7Ol6SB9Ct5iIMDQ04Jln4O+PhASIRK2Nej3mzsWNG7h5kx6ATzqNeqNEGOzt8fnnUKmwfDnOn4dGg59/RlgY1Gp89RVlKDEFrakngrFiBfr1wz/+AW/v1pbJk3HwIAIDeS2LmD26qCfCU1qKykoMGoTBg/kuhfQFFKOEEGISGhslhBCTUIwSQohJKEYJIcQkFKOEEGISilFCCDHJ/wdHQnZEzt3HwwAAARV6VFh0cmRraXRQS0wgcmRraXQgMjAyMy4wMy4zAAB4nHu/b+09BiDgZYAAJiDmgeIGRjaGBCDNyMzmoAGkmVnYHDJANDMjEgMqwwCimVjYITRcB7uCFtgEFg6wBDMTB1jgP5IR3AyMDIxMGUxMzAnMLBlMLKwKrGwaQJ0J7BwKHJwaTBxcCuzcGUzcjAkijEAdbIzc7CzMTOKzQOZCXc3Ak2pUfqB6zf19II7oXukDEiJzbEDsFHf2A8Ls++xB7BAP/f1NST/AbN+cm3axfnlg9ibXt/bzmjaC2ZoSQQ68916D2XK/r9lq3OfYD2K/z5tt/3zVUTD7uI6mQ4V/N5gtw55qf3WBwwEQ+23Vyv1s02rB4mIAVeA7BtKxTD0AAAF2elRYdE1PTCByZGtpdCAyMDIzLjAzLjMAAHicfVPbTsMwDH3vV/gHGvmW2wMPWzsNBGslGPsH3vl/YXfa0kFFUlduchzH57gd+HgfX7++4T547DoA/OeptcJFELE7gTuwPxxfJhjOu/1tZZg/p/MHEPuDPh+xu/N8uq0QDNBLKIk1EvQYVFJJAhhwGS2WHcm2L0rJ96li3ALKFUgkWewKQYvGShtAdSCGVDTVbMCqGDFtAKMB7WasKao5VbCUrczJcBRKtBKqOVJSNrb+4jJMIIELZ44eoJxJN3BlyUuoNS/cRLEbxA1gtQMpMKmwQE8hqh1ZVkAYno9PBJfd25PeqUeYgUMyRmPxKK9qk3oiQ2IoVZOiy4VYC6Xf5/fXBHQPWyQzHlgxqRdQTbKMGxkO0/jQFtdG2c/T2BrFJ7duUDNpmqtbU9ZnbPqRWWoyiVluahgUSiOdzGqjls0IV6yRL9CKHPUgXpWt/uJ1cetS/Pv2v5jf/QAWEKpqgklGFwAAAMd6VFh0U01JTEVTIHJka2l0IDIwMjMuMDMuMwAAeJwdjztuAzEMBa8SIM0uQhH8i8TClXv7AIYrXcOHD+WOetAMH++L11rH/fdxruP1+Hsft+f5eo73ufjncwzFDDGHQWgaGQrXkB7VBAiJi1zimzHrVGC0NK9OCCMtanZURs5wtUIs3Bospcx2MaZrVP/RjIRLUVKm9DtN5pdhsuqpfa5N+4aETQUGo5tJY4LRlWIn2xuby7Iw6AOIKqUL9Q4xim2qrj3h/PwDCjI0jeW9YP8AAAAASUVORK5CYII=",
      "text/plain": [
       "<rdkit.Chem.rdchem.Mol at 0x7f2d5e0d3cf0>"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "Chem.MolFromSmiles('CC1=CC=C(C#N)C([N+](=O)[O-])=C1')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'CC1=CC=C(C#N)C([N+](=O)[O-])=C1'"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "canonicalize_molecule_smiles(Chem.MolToSmiles(Chem.MolFromInchi(Chem.MolToInchi(Chem.MolFromSmiles('CC1=CC=C(C#N)C([N+](=O)[O-])=C1')))))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "'CC1=CC=C(C#N)C([N+](=O)[O-])=C1' == 'CC1=CC=C(C#N)C([N+](=O)[O-])=C1'"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "lora",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
