{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "01a84d64",
   "metadata": {},
   "source": [
    "# We recommend performing UMLS knowledge retrieval using APIs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "26ae78b0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Collecting umls-api\n",
      "  Downloading umls-api-0.1.0.tar.gz (4.6 kB)\n",
      "  Preparing metadata (setup.py) ... \u001b[?25ldone\n",
      "\u001b[?25hRequirement already satisfied: requests in /home/wxy/anaconda3/envs/arl/lib/python3.7/site-packages (from umls-api) (2.28.2)\n",
      "Requirement already satisfied: lxml in /home/wxy/anaconda3/envs/arl/lib/python3.7/site-packages (from umls-api) (4.9.1)\n",
      "Collecting cachetools<5.0.0,>=4.0.0\n",
      "  Downloading cachetools-4.2.4-py3-none-any.whl (10 kB)\n",
      "Requirement already satisfied: charset-normalizer<4,>=2 in /home/wxy/anaconda3/envs/arl/lib/python3.7/site-packages (from requests->umls-api) (3.1.0)\n",
      "Requirement already satisfied: idna<4,>=2.5 in /home/wxy/anaconda3/envs/arl/lib/python3.7/site-packages (from requests->umls-api) (3.4)\n",
      "Requirement already satisfied: certifi>=2017.4.17 in /home/wxy/anaconda3/envs/arl/lib/python3.7/site-packages (from requests->umls-api) (2022.12.7)\n",
      "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /home/wxy/anaconda3/envs/arl/lib/python3.7/site-packages (from requests->umls-api) (1.26.15)\n",
      "Building wheels for collected packages: umls-api\n",
      "  Building wheel for umls-api (setup.py) ... \u001b[?25ldone\n",
      "\u001b[?25h  Created wheel for umls-api: filename=umls_api-0.1.0-py3-none-any.whl size=3384 sha256=0834dbcd29a60375621e57da100e2834024f38e471bfde2b7aad52588b4ba9da\n",
      "  Stored in directory: /home/wxy/.cache/pip/wheels/40/d1/1b/52cfe03978dfc09cc52fc981a7a85182ce1891f42ce5af30e9\n",
      "Successfully built umls-api\n",
      "Installing collected packages: cachetools, umls-api\n",
      "  Attempting uninstall: cachetools\n",
      "    Found existing installation: cachetools 5.3.0\n",
      "    Uninstalling cachetools-5.3.0:\n",
      "      Successfully uninstalled cachetools-5.3.0\n",
      "Successfully installed cachetools-4.2.4 umls-api-0.1.0\n"
     ]
    }
   ],
   "source": [
    "!pip install umls-api"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "600fe55b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import torch\n",
    "import os\n",
    "import pickle\n",
    "import pandas as pd\n",
    "import requests\n",
    "from lxml.html import fromstring\n",
    "from cachetools import cached, TTLCache\n",
    "import umls_api\n",
    "\n",
    "\n",
    "abbr={'RQ':'is related and possibly synonymous with',\n",
    "      'SY':'is asserted to be synonymy of',\n",
    "      'RN':'denotes a narrower concept compared with',\n",
    "      'RB':'denotes a broader concept compared with',\n",
    "      'QB':'can be qualified by',\n",
    "      'PAR':'include',\n",
    "      'CHD':'is part of (belongs to)',    \n",
    "      }\n",
    "\n",
    "\n",
    "TTL_7HRS = TTLCache(maxsize=2, ttl=25200)\n",
    "\n",
    "def cui2name(CUI):\n",
    "    res = umls_api.API(api_key='72d06e11-2fa4-4bf1-b702-ee2d852038a7').get_cui(cui=CUI)\n",
    "    return res['result']['name']\n",
    "def link2name(link):\n",
    "    res = umls_api.API(api_key='72d06e11-2fa4-4bf1-b702-ee2d852038a7').get_snomedct(link=link)\n",
    "    return res['result']['name']\n",
    "\n",
    "class Auth:\n",
    "    def __init__(self, api_key):\n",
    "        self._api_key = api_key\n",
    "\n",
    "    @cached(TTL_7HRS)\n",
    "    def get_single_use_service_ticket(self):\n",
    "        url = 'https://utslogin.nlm.nih.gov/cas/v1/api-key'\n",
    "        headers = {\n",
    "            'Content-type': 'application/x-www-form-urlencoded',\n",
    "            'Accept': 'text/plain',\n",
    "            'User-Agent': 'python'\n",
    "        }\n",
    "        resp = requests.post(\n",
    "            url, data={'apikey': self._api_key}, headers=headers\n",
    "        )\n",
    "        resp.raise_for_status()\n",
    "        html = fromstring(resp.text)\n",
    "        ticket_granting_ticket_url = html.xpath('//form/@action')[0]\n",
    "\n",
    "        resp = requests.post(\n",
    "            ticket_granting_ticket_url,\n",
    "            data={'service': 'http://umlsks.nlm.nih.gov'},\n",
    "            headers=headers\n",
    "        )\n",
    "        resp.raise_for_status()\n",
    "        single_use_service_ticket = resp.text\n",
    "        return single_use_service_ticket\n",
    "\n",
    "class API:\n",
    "    BASE_URL = 'https://uts-ws.nlm.nih.gov/rest'\n",
    "                # https://uts-ws.nlm.nih.gov/rest/content/current/CUI/C0155502/definitions?apiKey=YOUR_APIKEY\n",
    "\n",
    "    def __init__(self, *, api_key, version='current'):\n",
    "        self._auth = Auth(api_key=api_key)\n",
    "        self._version = version\n",
    "        self.api_key=api_key\n",
    "        self.foreign=['SCTSPA','MSHPOR','MSHSPA','MSHCZE','MSHSWE','MSHNOR']\n",
    "\n",
    "    def get_cui(self, cui):\n",
    "        url = f'{self.BASE_URL}/content/{self._version}/CUI/{cui}'\n",
    "        return self._get(url=url)\n",
    "    \n",
    "    def get_name(self, cui):\n",
    "        url = f'{self.BASE_URL}/content/{self._version}/CUI/{cui}'\n",
    "        return self._get(url=url)['result']['name']\n",
    "    \n",
    "    def get_def(self, cui):\n",
    "        defi=[]\n",
    "        url = f'{self.BASE_URL}/content/{self._version}/CUI/{cui}/definitions?apiKey='+self.api_key\n",
    "        try:\n",
    "            ret = self._get(url=url)['result']\n",
    "            for source in ret:\n",
    "                if source['rootSource'] not in self.foreign:\n",
    "                    defi.append(source['value'])\n",
    "            res=defi[0]\n",
    "            for r in defi:\n",
    "                if len(r)< len(res):\n",
    "                    res=r\n",
    "            return res\n",
    "        except:\n",
    "            return 'HTTPError'\n",
    "        \n",
    "    def get_defall(self, cui):\n",
    "        url = f'{self.BASE_URL}/content/{self._version}/CUI/{cui}/definitions?apiKey='+self.api_key\n",
    "        return self._get(url=url)['result']\n",
    "    def get_rel(self, cui):\n",
    "        url = f'{self.BASE_URL}/content/{self._version}/CUI/{cui}/relations?apiKey='+self.api_key\n",
    "        total= self._get(url=url)['result']\n",
    "        r=[]\n",
    "        print('Query CUI:',cui)\n",
    "        for info in total:\n",
    "            source=info['rootSource']\n",
    "            if len(source)!=6 or source=='MEDCIN':\n",
    "                if source=='KCD5':\n",
    "                    continue\n",
    "                try:\n",
    "                    head=info['relatedFromIdName'] \n",
    "                except KeyError:\n",
    "                    # head='XXX '\n",
    "                    head=cui2name(cui)\n",
    "                try:\n",
    "                # if hasattr(info, \"relatedIdName\"):\n",
    "                    tail=info[\"relatedIdName\"]\n",
    "                    print('relatedId:',tail)\n",
    "                except KeyError:\n",
    "                    print('relatedId:',info[\"relatedId\"])\n",
    "                    if info[\"relatedId\"].split('/')[-2]=='CUI':\n",
    "                        tail=cui2name(info[\"relatedId\"].split('/')[-1])\n",
    "                    else:\n",
    "                        tail=link2name(info[\"relatedId\"])\n",
    "                try:\n",
    "                    rel_label=info['additionalRelationLabel']\n",
    "                    if rel_label==\"\":\n",
    "                        rel_label=info['relationLabel']\n",
    "                    print('RelationLabel:',rel_label)\n",
    "                except KeyError:\n",
    "                    print('RelationLabel:',info['relationLabel'])\n",
    "                    rel_label=info['relationLabel']\n",
    "                if rel_label=='RO':\n",
    "                    continue\n",
    "                if rel_label in abbr.keys():\n",
    "                    rel_label=abbr[rel_label]\n",
    "                if rel_label==\"inverse_isa\":\n",
    "                    rel=' '.join([tail,' is a ',head])\n",
    "                else:\n",
    "                    rel=' '.join([head,rel_label,tail])\n",
    "\n",
    "                r.append([rel,source])\n",
    "        return r\n",
    "\n",
    "            \n",
    "    \n",
    "    def get_cui_code(self, keyword):\n",
    "        url = f'{self.BASE_URL}/search/{self._version}/?string={keyword}'\n",
    "        candidates= self._get(url=url)['result']['results']\n",
    "        for i in range(3):\n",
    "            cui=candidates[i]['ui']\n",
    "            name=candidates[i]['name']\n",
    "            print(f'No.{i+1} => CUI = {cui}, Concept Name: {name}')\n",
    "        return candidates[0]['ui']\n",
    "\n",
    "    def _get(self, url):\n",
    "        ticket = self._auth.get_single_use_service_ticket()\n",
    "        resp = requests.get(url, params={'ticket': ticket})\n",
    "        resp.raise_for_status()\n",
    "        return resp.json()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "dddd9bc3",
   "metadata": {},
   "source": [
    "# Definition Retrieval"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "fd80f806",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "C2712342: Bladder stone (substance): A concretion in the urinary bladder.\n"
     ]
    }
   ],
   "source": [
    "CUI='C2712342'\n",
    "cui_name= API(api_key='72d06e11-2fa4-4bf1-b702-ee2d852038a7').get_name(cui=CUI)\n",
    "cui_def = API(api_key='72d06e11-2fa4-4bf1-b702-ee2d852038a7').get_def(cui=CUI)\n",
    "print(\": \".join([CUI, cui_name, cui_def]))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bfbefc2b",
   "metadata": {},
   "source": [
    "# Relationship Retrieval"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "cb34a0d9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Query CUI: C2712342\n",
      "relatedId: Urinary bladder calculus specimen\n",
      "RelationLabel: specimen_substance_of\n",
      "relatedId: Urinary bladder stone (disorder)\n",
      "RelationLabel: RO\n",
      "relatedId: Analysis of calculus of urinary bladder\n",
      "RelationLabel: component_of\n",
      "relatedId: Urinary Stone\n",
      "RelationLabel: isa\n",
      "relatedId: Urinary system calculus\n",
      "RelationLabel: isa\n",
      "[['Bladder stone specimen_substance_of Urinary bladder calculus specimen', 'SNOMEDCT_US'], ['Bladder stone component_of Analysis of calculus of urinary bladder', 'SNOMEDCT_US'], ['Urinary Bladder Stone isa Urinary Stone', 'NCI'], ['Bladder stone isa Urinary system calculus', 'SNOMEDCT_US']]\n"
     ]
    }
   ],
   "source": [
    "cui_rel = API(api_key='72d06e11-2fa4-4bf1-b702-ee2d852038a7').get_rel(cui=CUI)\n",
    "print(cui_rel)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:arl]",
   "language": "python",
   "name": "conda-env-arl-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
