{
    "cells": [
        {
            "attachments": {},
            "cell_type": "markdown",
            "metadata": {},
            "source": [
                "# MIMIC 4 data - dataset construction prescriptions"
            ]
        },
        {
            "attachments": {},
            "cell_type": "markdown",
            "metadata": {},
            "source": [
                "Code taken from GRU-ODE-Bayes preprocessing; simplified and adapted for MIMIC 4 1.0"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 1,
            "metadata": {},
            "outputs": [],
            "source": [
                "import os\n",
                "import pathlib\n",
                "\n",
                "p_project = str(pathlib.Path(os.getcwd()).parents[1])"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 2,
            "metadata": {},
            "outputs": [],
            "source": [
                "import pandas as pd\n",
                "from datetime import datetime\n",
                "import numpy as np"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 3,
            "metadata": {},
            "outputs": [],
            "source": [
                "pd.set_option('display.max_rows', 50)\n",
                "pd.set_option('display.max_columns', 300)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 4,
            "metadata": {},
            "outputs": [],
            "source": [
                "path_data = p_project + '/data/original/mimic4'\n",
                "path_temp = p_project + '/data/mimic4'"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 5,
            "metadata": {},
            "outputs": [],
            "source": [
                "adm = pd.read_csv(path_temp + '/processed/admissions_processed.csv')"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 7,
            "metadata": {},
            "outputs": [
                {
                    "name": "stderr",
                    "output_type": "stream",
                    "text": [
                        "/tmp/ipykernel_4096557/807499757.py:2: DtypeWarning: Columns (7) have mixed types. Specify dtype option on import or set low_memory=False.\n",
                        "  presc=pd.read_csv(path_data + '/hosp/prescriptions.csv.gz')\n"
                    ]
                },
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "Number of patients remaining in the database: \n",
                        "44057\n"
                    ]
                },
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th></th>\n",
                            "      <th>subject_id</th>\n",
                            "      <th>hadm_id</th>\n",
                            "      <th>pharmacy_id</th>\n",
                            "      <th>starttime</th>\n",
                            "      <th>stoptime</th>\n",
                            "      <th>drug_type</th>\n",
                            "      <th>drug</th>\n",
                            "      <th>gsn</th>\n",
                            "      <th>ndc</th>\n",
                            "      <th>prod_strength</th>\n",
                            "      <th>form_rx</th>\n",
                            "      <th>dose_val_rx</th>\n",
                            "      <th>dose_unit_rx</th>\n",
                            "      <th>form_val_disp</th>\n",
                            "      <th>form_unit_disp</th>\n",
                            "      <th>doses_per_24_hrs</th>\n",
                            "      <th>route</th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>17008042</th>\n",
                            "      <td>17587395</td>\n",
                            "      <td>29827111</td>\n",
                            "      <td>68950197</td>\n",
                            "      <td>2130-04-18 08:00:00</td>\n",
                            "      <td>2130-04-18 11:00:00</td>\n",
                            "      <td>MAIN</td>\n",
                            "      <td>INV-Cabozantinib (Cabozantinib)</td>\n",
                            "      <td>70388.0</td>\n",
                            "      <td>4.238800e+10</td>\n",
                            "      <td>20 mg Tablet</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>20</td>\n",
                            "      <td>mg</td>\n",
                            "      <td>1</td>\n",
                            "      <td>TAB</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>ORAL</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>17008043</th>\n",
                            "      <td>17587395</td>\n",
                            "      <td>29827111</td>\n",
                            "      <td>31601255</td>\n",
                            "      <td>2130-04-18 08:00:00</td>\n",
                            "      <td>2130-04-23 10:00:00</td>\n",
                            "      <td>MAIN</td>\n",
                            "      <td>INV-Cabozantinib (Cabozantinib)</td>\n",
                            "      <td>70388.0</td>\n",
                            "      <td>4.238800e+10</td>\n",
                            "      <td>20 mg Tablet</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>20</td>\n",
                            "      <td>mg</td>\n",
                            "      <td>1</td>\n",
                            "      <td>TAB</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>ORAL</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>17008044</th>\n",
                            "      <td>17587395</td>\n",
                            "      <td>29827111</td>\n",
                            "      <td>23581378</td>\n",
                            "      <td>2130-04-23 11:00:00</td>\n",
                            "      <td>2130-05-21 07:00:00</td>\n",
                            "      <td>MAIN</td>\n",
                            "      <td>INV-Cabozantinib (Cabozantinib)</td>\n",
                            "      <td>70388.0</td>\n",
                            "      <td>4.238800e+10</td>\n",
                            "      <td>20 mg Tablet</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>40</td>\n",
                            "      <td>mg</td>\n",
                            "      <td>2</td>\n",
                            "      <td>TAB</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>ORAL</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>17008049</th>\n",
                            "      <td>15906963</td>\n",
                            "      <td>20494713</td>\n",
                            "      <td>9933337</td>\n",
                            "      <td>2164-11-17 12:00:00</td>\n",
                            "      <td>2164-11-18 11:00:00</td>\n",
                            "      <td>MAIN</td>\n",
                            "      <td>Fentanyl Citrate</td>\n",
                            "      <td>41384.0</td>\n",
                            "      <td>4.099093e+08</td>\n",
                            "      <td>100mcg/2mL Amp</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>25-100</td>\n",
                            "      <td>mcg</td>\n",
                            "      <td>0.5-2</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>IV</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>17008051</th>\n",
                            "      <td>17961555</td>\n",
                            "      <td>22879995</td>\n",
                            "      <td>50647416</td>\n",
                            "      <td>2171-01-24 05:00:00</td>\n",
                            "      <td>2171-02-03 20:00:00</td>\n",
                            "      <td>MAIN</td>\n",
                            "      <td>Acetaminophen-Caff-Butalbital</td>\n",
                            "      <td>4451.0</td>\n",
                            "      <td>5.913369e+08</td>\n",
                            "      <td>1 Tablet</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>1-2</td>\n",
                            "      <td>TAB</td>\n",
                            "      <td>1-2</td>\n",
                            "      <td>TAB</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>PO</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "          subject_id   hadm_id  pharmacy_id            starttime  \\\n",
                            "17008042    17587395  29827111     68950197  2130-04-18 08:00:00   \n",
                            "17008043    17587395  29827111     31601255  2130-04-18 08:00:00   \n",
                            "17008044    17587395  29827111     23581378  2130-04-23 11:00:00   \n",
                            "17008049    15906963  20494713      9933337  2164-11-17 12:00:00   \n",
                            "17008051    17961555  22879995     50647416  2171-01-24 05:00:00   \n",
                            "\n",
                            "                     stoptime drug_type                             drug  \\\n",
                            "17008042  2130-04-18 11:00:00      MAIN  INV-Cabozantinib (Cabozantinib)   \n",
                            "17008043  2130-04-23 10:00:00      MAIN  INV-Cabozantinib (Cabozantinib)   \n",
                            "17008044  2130-05-21 07:00:00      MAIN  INV-Cabozantinib (Cabozantinib)   \n",
                            "17008049  2164-11-18 11:00:00      MAIN                 Fentanyl Citrate   \n",
                            "17008051  2171-02-03 20:00:00      MAIN    Acetaminophen-Caff-Butalbital   \n",
                            "\n",
                            "              gsn           ndc   prod_strength form_rx dose_val_rx  \\\n",
                            "17008042  70388.0  4.238800e+10    20 mg Tablet     NaN          20   \n",
                            "17008043  70388.0  4.238800e+10    20 mg Tablet     NaN          20   \n",
                            "17008044  70388.0  4.238800e+10    20 mg Tablet     NaN          40   \n",
                            "17008049  41384.0  4.099093e+08  100mcg/2mL Amp     NaN      25-100   \n",
                            "17008051   4451.0  5.913369e+08        1 Tablet     NaN         1-2   \n",
                            "\n",
                            "         dose_unit_rx form_val_disp form_unit_disp  doses_per_24_hrs route  \n",
                            "17008042           mg             1            TAB               1.0  ORAL  \n",
                            "17008043           mg             1            TAB               1.0  ORAL  \n",
                            "17008044           mg             2            TAB               1.0  ORAL  \n",
                            "17008049          mcg         0.5-2             mL               1.0    IV  \n",
                            "17008051          TAB           1-2            TAB               NaN    PO  "
                        ]
                    },
                    "execution_count": 7,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "# only choose previously selected admission ids\n",
                "presc=pd.read_csv(path_data + '/hosp/prescriptions.csv.gz')\n",
                "adm_ids=list(adm['hadm_id'])\n",
                "presc=presc.loc[presc['hadm_id'].isin(adm_ids)]\n",
                "\n",
                "print('Number of patients remaining in the database: ')\n",
                "print(presc['subject_id'].nunique())\n",
                "presc.tail()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 8,
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "drug\n",
                        "Sodium Chloride 0.9%  Flush    42564\n",
                        "0.9% Sodium Chloride           38380\n",
                        "Acetaminophen                  36894\n",
                        "Magnesium Sulfate              35644\n",
                        "Heparin                        34172\n",
                        "Potassium Chloride             33721\n",
                        "Bag                            30606\n",
                        "Docusate Sodium                30602\n",
                        "Senna                          29900\n",
                        "5% Dextrose                    29224\n",
                        "Insulin                        28890\n",
                        "Iso-Osmotic Dextrose           28389\n",
                        "Calcium Gluconate              28332\n",
                        "Dextrose 50%                   27926\n",
                        "Glucagon                       25967\n",
                        "Bisacodyl                      24802\n",
                        "Furosemide                     24701\n",
                        "Metoprolol Tartrate            23264\n",
                        "Ondansetron                    23252\n",
                        "Vancomycin                     23075\n",
                        "Name: subject_id, dtype: int64\n"
                    ]
                }
            ],
            "source": [
                "# take only the n most used items\n",
                "n_best=20\n",
                "pat_for_item=presc.groupby('drug')['subject_id'].nunique()\n",
                "frequent_labels=pat_for_item.sort_values(ascending=False)[:n_best]\n",
                "\n",
                "print(frequent_labels)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 9,
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "Number of patients remaining in the database: \n",
                        "44045\n"
                    ]
                }
            ],
            "source": [
                "#Select entries whose drug name is in the list from the paper.\n",
                "drugs_list=['Acetaminophen', 'Aspirin','Bisacodyl','Insulin','Heparin','Docusate Sodium','D5W','Potassium Chloride','Magnesium Sulfate','Metoprolol Tartrate','Sodium Chloride 0.9%  Flush','Pantoprazole']\n",
                "presc2=presc.loc[presc['drug'].isin(drugs_list)]\n",
                "\n",
                "print('Number of patients remaining in the database: ')\n",
                "print(presc2['subject_id'].nunique())"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 10,
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "drug                         dose_unit_rx\n",
                        "Acetaminophen                mg              108526\n",
                        "                             g                   25\n",
                        "                             gm                   1\n",
                        "Aspirin                      mg               40510\n",
                        "Bisacodyl                    mg               54841\n",
                        "D5W                          mL               28727\n",
                        "                             SYR                 31\n",
                        "                             ml                   8\n",
                        "                             BTL                  2\n",
                        "Docusate Sodium              mg               68021\n",
                        "                             mL                   1\n",
                        "Heparin                      UNIT             81700\n",
                        "                             units               81\n",
                        "                             Units/Liter          2\n",
                        "                             mg                   1\n",
                        "Insulin                      UNIT            222294\n",
                        "                             units                5\n",
                        "Magnesium Sulfate            gm              145797\n",
                        "                             mEq                 28\n",
                        "                             g                    1\n",
                        "                             mg                   1\n",
                        "Metoprolol Tartrate          mg              136834\n",
                        "                             mL                   1\n",
                        "Pantoprazole                 mg               38063\n",
                        "                             mL                   1\n",
                        "Potassium Chloride           mEq             238028\n",
                        "                             mmol                 3\n",
                        "                             mL                   1\n",
                        "                             mg                   1\n",
                        "Sodium Chloride 0.9%  Flush  mL              165655\n",
                        "                             ml                   3\n",
                        "Name: count, dtype: int64\n"
                    ]
                }
            ],
            "source": [
                "print(presc2.groupby('drug')['dose_unit_rx'].value_counts())"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 11,
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "drug                         dose_unit_rx\n",
                        "Acetaminophen                mg              108526\n",
                        "Aspirin                      mg               40510\n",
                        "Bisacodyl                    mg               54841\n",
                        "D5W                          mL               28735\n",
                        "Docusate Sodium              mg               68021\n",
                        "Heparin                      UNIT             81700\n",
                        "Insulin                      UNIT            222294\n",
                        "Magnesium Sulfate            gm              145797\n",
                        "Metoprolol Tartrate          mg              136834\n",
                        "Pantoprazole                 mg               38063\n",
                        "Potassium Chloride           mEq             238028\n",
                        "Sodium Chloride 0.9%  Flush  mL              165658\n",
                        "Name: count, dtype: int64\n"
                    ]
                }
            ],
            "source": [
                "#Units correction\n",
                "presc2=presc2.drop(presc2.loc[presc2['dose_unit_rx'].isnull()].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Acetaminophen')&(presc2['dose_unit_rx']!='mg')].index).copy()\n",
                "presc2.loc[(presc2['drug']=='D5W')&(presc2['dose_unit_rx']=='ml'),'dose_unit_rx']='mL'\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='D5W')&(presc2['dose_unit_rx']!='mL')].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Heparin')&(presc2['dose_unit_rx']!='UNIT')].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Insulin')&(presc2['dose_unit_rx']!='UNIT')].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Magnesium Sulfate')&(presc2['dose_unit_rx']!='gm')].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Potassium Chloride')&(presc2['dose_unit_rx']!='mEq')].index).copy()\n",
                "presc2.loc[(presc2['drug']=='Sodium Chloride 0.9%  Flush')&(presc2['dose_unit_rx']=='ml'),'dose_unit_rx']='mL'\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Bisacodyl')&(presc2['dose_unit_rx']!='mg')].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Pantoprazole')&(presc2['dose_unit_rx']!='mg')].index).copy()\n",
                "\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Docusate Sodium')&(presc2['dose_unit_rx']!='mg')].index).copy()\n",
                "presc2=presc2.drop(presc2.loc[(presc2['drug']=='Metoprolol Tartrate')&(presc2['dose_unit_rx']!='mg')].index).copy()\n",
                "\n",
                "print(presc2.groupby('drug')['dose_unit_rx'].value_counts())"
            ]
        },
        {
            "attachments": {},
            "cell_type": "markdown",
            "metadata": {},
            "source": [
                "### Check for outliers\n",
                "\n",
                "#### 1) In amounts"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 13,
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "Lost entries in the process : 245\n"
                    ]
                }
            ],
            "source": [
                "type(presc2[\"dose_val_rx\"])\n",
                "\n",
                "#We need to transform the value columns in float type.\n",
                "original_num_entries=len(presc2.index)\n",
                "\n",
                "presc2.dropna(subset=['dose_val_rx'], inplace=True)\n",
                "presc2.drop(presc2.loc[presc2['dose_val_rx'].str.contains(\"'\")].index, inplace=True)\n",
                "\n",
                "#First transform the ranges (xx-yy) as the mean of the ranges.\n",
                "range_df=presc2.loc[presc2[\"dose_val_rx\"].str.contains(\"-\")].copy()\n",
                "range_df[\"First_digit\"]=range_df[\"dose_val_rx\"].str.split(\"-\").str[0]\n",
                "range_df.loc[range_df[\"First_digit\"]==\"\",'First_digit'] = 0.0\n",
                "range_df[\"First_digit\"] = range_df[\"First_digit\"].astype(float)\n",
                "range_df[\"Second_digit\"]=range_df[\"dose_val_rx\"].str.split(\"-\").str[1]\n",
                "range_df.loc[range_df[\"Second_digit\"]==\"\",'Second_digit']=range_df.loc[range_df[\"Second_digit\"]==\"\",'First_digit']\n",
                "range_df[\"Second_digit\"]=range_df[\"Second_digit\"].astype(float)\n",
                "range_df[\"mean\"]=(range_df[\"First_digit\"]+range_df[\"Second_digit\"])/2\n",
                "range_df[\"dose_val_rx\"]=range_df[\"mean\"]\n",
                "range_df.drop(columns=[\"First_digit\",\"Second_digit\",\"mean\"],inplace=True)\n",
                "\n",
                "#Now remove the entries with the - from the original df and force conversion to float.\n",
                "presc3=presc2.drop(presc2.loc[presc2[\"dose_val_rx\"].str.contains(\"-\")].index).copy()\n",
                "presc3[\"dose_val_rx\"]=pd.to_numeric(presc2[\"dose_val_rx\"], errors=\"coerce\")\n",
                "presc3.dropna(subset=[\"dose_val_rx\"],inplace=True)\n",
                "\n",
                "presc2 = pd.concat([presc3, range_df], ignore_index=True)\n",
                "\n",
                "print(\"Lost entries in the process : {}\".format(original_num_entries-len(presc2.index)))\n"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 14,
            "metadata": {},
            "outputs": [],
            "source": [
                "#To avoid confounding labels with labels from other tables, we add 'drug' to the name\n",
                "presc2['charttime']=pd.to_datetime(presc2['starttime'], format='%Y-%m-%d %H:%M:%S')\n",
                "presc2['drug']=presc2['drug']+' Drug'"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 15,
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th></th>\n",
                            "      <th>subject_id</th>\n",
                            "      <th>hadm_id</th>\n",
                            "      <th>pharmacy_id</th>\n",
                            "      <th>starttime</th>\n",
                            "      <th>stoptime</th>\n",
                            "      <th>drug_type</th>\n",
                            "      <th>drug</th>\n",
                            "      <th>gsn</th>\n",
                            "      <th>ndc</th>\n",
                            "      <th>prod_strength</th>\n",
                            "      <th>form_rx</th>\n",
                            "      <th>dose_val_rx</th>\n",
                            "      <th>dose_unit_rx</th>\n",
                            "      <th>form_val_disp</th>\n",
                            "      <th>form_unit_disp</th>\n",
                            "      <th>doses_per_24_hrs</th>\n",
                            "      <th>route</th>\n",
                            "      <th>charttime</th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>0</th>\n",
                            "      <td>12315540</td>\n",
                            "      <td>23248664</td>\n",
                            "      <td>94413048</td>\n",
                            "      <td>2172-12-03 20:00:00</td>\n",
                            "      <td>2172-12-05 10:00:00</td>\n",
                            "      <td>MAIN</td>\n",
                            "      <td>Heparin Drug</td>\n",
                            "      <td>006549</td>\n",
                            "      <td>6.332303e+10</td>\n",
                            "      <td>5000 Units / mL- 1mL Vial</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>5000.0</td>\n",
                            "      <td>UNIT</td>\n",
                            "      <td>1</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>3.0</td>\n",
                            "      <td>SC</td>\n",
                            "      <td>2172-12-03 20:00:00</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>1</th>\n",
                            "      <td>12315540</td>\n",
                            "      <td>23248664</td>\n",
                            "      <td>68412815</td>\n",
                            "      <td>2172-12-03 23:00:00</td>\n",
                            "      <td>2172-12-04 22:00:00</td>\n",
                            "      <td>BASE</td>\n",
                            "      <td>D5W Drug</td>\n",
                            "      <td>001972</td>\n",
                            "      <td>4.097923e+08</td>\n",
                            "      <td>100mL Bag</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>100.0</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>100</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>IV</td>\n",
                            "      <td>2172-12-03 23:00:00</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>2</th>\n",
                            "      <td>12315540</td>\n",
                            "      <td>23248664</td>\n",
                            "      <td>92297162</td>\n",
                            "      <td>2172-12-03 23:00:00</td>\n",
                            "      <td>2172-12-04 12:00:00</td>\n",
                            "      <td>BASE</td>\n",
                            "      <td>D5W Drug</td>\n",
                            "      <td>001972</td>\n",
                            "      <td>3.380017e+08</td>\n",
                            "      <td>250mL Bag</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>250.0</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>250</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>IV</td>\n",
                            "      <td>2172-12-03 23:00:00</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>3</th>\n",
                            "      <td>12315540</td>\n",
                            "      <td>23248664</td>\n",
                            "      <td>47490519</td>\n",
                            "      <td>2172-12-03 23:00:00</td>\n",
                            "      <td>2172-12-04 12:00:00</td>\n",
                            "      <td>BASE</td>\n",
                            "      <td>D5W Drug</td>\n",
                            "      <td>001972</td>\n",
                            "      <td>3.380017e+08</td>\n",
                            "      <td>250mL Bag</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>250.0</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>250</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>IV</td>\n",
                            "      <td>2172-12-03 23:00:00</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>4</th>\n",
                            "      <td>12315540</td>\n",
                            "      <td>23248664</td>\n",
                            "      <td>34102962</td>\n",
                            "      <td>2172-12-04 11:00:00</td>\n",
                            "      <td>2172-12-05 10:00:00</td>\n",
                            "      <td>BASE</td>\n",
                            "      <td>D5W Drug</td>\n",
                            "      <td>001972</td>\n",
                            "      <td>3.380017e+08</td>\n",
                            "      <td>50mL Bag</td>\n",
                            "      <td>NaN</td>\n",
                            "      <td>50.0</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>50</td>\n",
                            "      <td>mL</td>\n",
                            "      <td>1.0</td>\n",
                            "      <td>IV</td>\n",
                            "      <td>2172-12-04 11:00:00</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "   subject_id   hadm_id  pharmacy_id            starttime  \\\n",
                            "0    12315540  23248664     94413048  2172-12-03 20:00:00   \n",
                            "1    12315540  23248664     68412815  2172-12-03 23:00:00   \n",
                            "2    12315540  23248664     92297162  2172-12-03 23:00:00   \n",
                            "3    12315540  23248664     47490519  2172-12-03 23:00:00   \n",
                            "4    12315540  23248664     34102962  2172-12-04 11:00:00   \n",
                            "\n",
                            "              stoptime drug_type          drug     gsn           ndc  \\\n",
                            "0  2172-12-05 10:00:00      MAIN  Heparin Drug  006549  6.332303e+10   \n",
                            "1  2172-12-04 22:00:00      BASE      D5W Drug  001972  4.097923e+08   \n",
                            "2  2172-12-04 12:00:00      BASE      D5W Drug  001972  3.380017e+08   \n",
                            "3  2172-12-04 12:00:00      BASE      D5W Drug  001972  3.380017e+08   \n",
                            "4  2172-12-05 10:00:00      BASE      D5W Drug  001972  3.380017e+08   \n",
                            "\n",
                            "               prod_strength form_rx  dose_val_rx dose_unit_rx form_val_disp  \\\n",
                            "0  5000 Units / mL- 1mL Vial     NaN       5000.0         UNIT             1   \n",
                            "1                  100mL Bag     NaN        100.0           mL           100   \n",
                            "2                  250mL Bag     NaN        250.0           mL           250   \n",
                            "3                  250mL Bag     NaN        250.0           mL           250   \n",
                            "4                   50mL Bag     NaN         50.0           mL            50   \n",
                            "\n",
                            "  form_unit_disp  doses_per_24_hrs route           charttime  \n",
                            "0             mL               3.0    SC 2172-12-03 20:00:00  \n",
                            "1             mL               1.0    IV 2172-12-03 23:00:00  \n",
                            "2             mL               1.0    IV 2172-12-03 23:00:00  \n",
                            "3             mL               1.0    IV 2172-12-03 23:00:00  \n",
                            "4             mL               1.0    IV 2172-12-04 11:00:00  "
                        ]
                    },
                    "execution_count": 15,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "presc2.head()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 16,
            "metadata": {},
            "outputs": [],
            "source": [
                "presc2.to_csv(path_temp + '/processed/prescriptions_processed.csv')"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "metadata": {},
            "outputs": [],
            "source": []
        }
    ],
    "metadata": {
        "kernelspec": {
            "display_name": "Python 3 (ipykernel)",
            "language": "python",
            "name": "python3"
        },
        "language_info": {
            "codemirror_mode": {
                "name": "ipython",
                "version": 3
            },
            "file_extension": ".py",
            "mimetype": "text/x-python",
            "name": "python",
            "nbconvert_exporter": "python",
            "pygments_lexer": "ipython3",
            "version": "3.8.12"
        },
        "vscode": {
            "interpreter": {
                "hash": "5ae865abb88ad0a991db65fb0a3113ce9d7dd5f50b65ef8b203d3356ff36831c"
            }
        }
    },
    "nbformat": 4,
    "nbformat_minor": 4
}
