{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "try:\n",
    "    import cPickle as pickle\n",
    "except ImportError:\n",
    "    import _pickle as pickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "disc_inp_data = pd.read_csv('./data/mimictable.csv')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "the reward function,  we don't care about terminal reward, but we care about mid-reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# ## nature 2017 Raghu et. al. reward function\n",
    "# # add rewards\n",
    "# c0 = -0.25\n",
    "# c1 = -0.75\n",
    "# c2 = -0.5\n",
    "# disc_inp_data['reward'] = 0\n",
    "# for i in disc_inp_data.index:\n",
    "#     if i == 0:\n",
    "#         continue\n",
    "#     if disc_inp_data.loc[i, 'icustayid'] == disc_inp_data.loc[i-1, 'icustayid']:\n",
    "#         sofa_cur = disc_inp_data.loc[i,'SOFA']\n",
    "#         sofa_prev = disc_inp_data.loc[i-1,'SOFA']\n",
    "#         lact_cur = disc_inp_data.loc[i,'Arterial_lactate']\n",
    "#         lact_prev = disc_inp_data.loc[i-1,'Arterial_lactate']\n",
    "#         reward = 0\n",
    "#         if sofa_cur == sofa_prev and sofa_cur != 0:\n",
    "#             reward += c0\n",
    "#         reward += c1*(sofa_cur-sofa_prev)\n",
    "#         reward += c2*np.tanh(lact_cur - lact_prev)\n",
    "#         disc_inp_data.loc[i-1,'reward'] = reward\n",
    "\n",
    "# if disc_inp_data.loc[len(disc_inp_data)-1, 'died_in_hosp'] == 1:\n",
    "#     disc_inp_data.loc[len(disc_inp_data)-1, 'reward'] = -15\n",
    "# elif disc_inp_data.loc[len(disc_inp_data)-1, 'died_in_hosp'] == 0:\n",
    "#      disc_inp_data.loc[len(disc_inp_data)-1, 'reward'] = 15"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 2022 huang et. al. reward function\n",
    "disc_inp_data['reward'] = 0\n",
    "# add rewards\n",
    "c0 = -0.25\n",
    "c1 = -0.2\n",
    "for i in disc_inp_data.index:\n",
    "    if i == 0:\n",
    "        continue\n",
    "    if disc_inp_data.loc[i, 'icustayid'] == disc_inp_data.loc[i-1, 'icustayid']:\n",
    "        sofa_cur = disc_inp_data.loc[i,'SOFA']\n",
    "        sofa_prev = disc_inp_data.loc[i-1,'SOFA']\n",
    "        reward = 0\n",
    "        reward += c0*np.tanh(sofa_prev-6)\n",
    "        reward += c1*(sofa_cur - sofa_prev)\n",
    "        disc_inp_data.loc[i-1,'reward'] += reward"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "normalization reward [0,1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "minimum = min(disc_inp_data['reward'])\n",
    "maximum = max(disc_inp_data['reward'])\n",
    "disc_inp_data['reward'] = (disc_inp_data['reward'] - minimum)/(maximum-minimum)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-3.5500030720873013 2.950000001030577\n"
     ]
    }
   ],
   "source": [
    "print(minimum,maximum)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Normalized data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "orig_data = disc_inp_data.copy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "binary_fields = ['gender','mechvent','re_admission']\n",
    "norm_fields= ['age','Weight_kg','GCS','HR','SysBP','MeanBP','DiaBP','RR','Temp_C','FiO2_1',\n",
    "    'Potassium','Sodium','Chloride','Glucose','Magnesium','Calcium',\n",
    "    'Hb','WBC_count','Platelets_count','PTT','PT','Arterial_pH','paO2','paCO2',\n",
    "    'Arterial_BE','HCO3','Arterial_lactate','SOFA','SIRS','Shock_Index',\n",
    "    'PaO2_FiO2', 'elixhauser', 'Albumin', u'CO2_mEqL', 'Ionised_Ca']\n",
    "log_fields = ['SpO2','BUN','Creatinine','SGOT','SGPT','Total_bili','INR',\n",
    "            'output_total','output_4hourly', 'bloc']\n",
    "# binary_fields = ['gender','mechvent','re_admission']\n",
    "# norm_fields= ['age','Weight_kg','GCS','HR','SysBP','MeanBP','DiaBP','RR','Temp_C','FiO2_1',\n",
    "#     'Potassium','Sodium','Chloride','Glucose','Magnesium','Calcium',\n",
    "#     'Hb','WBC_count','Platelets_count','PTT','PT','Arterial_pH','paO2','paCO2',\n",
    "#     'Arterial_BE','HCO3','Arterial_lactate',\n",
    "#     'PaO2_FiO2', u'CO2_mEqL', 'Ionised_Ca']\n",
    "# log_fields = ['SpO2','BUN','Creatinine','SGOT','SGPT','Total_bili','INR']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "norm_fields_av = []\n",
    "norm_fields_std = []\n",
    "log_fields_av = []\n",
    "log_fields_std = []\n",
    "# normalise binary fields\n",
    "disc_inp_data[binary_fields] = disc_inp_data[binary_fields] - 0.5 \n",
    "# normal distn fields\n",
    "for item in norm_fields:\n",
    "    av = disc_inp_data[item].mean()\n",
    "    std = disc_inp_data[item].std()\n",
    "    disc_inp_data[item] = (disc_inp_data[item] - av) / std\n",
    "    norm_fields_av.append(av)\n",
    "    norm_fields_std.append(std)\n",
    "# log normal fields、\n",
    "disc_inp_data[log_fields] = np.log(0.1 + disc_inp_data[log_fields])\n",
    "for item in log_fields:\n",
    "    av = disc_inp_data[item].mean()\n",
    "    std = disc_inp_data[item].std()\n",
    "    disc_inp_data[item] = (disc_inp_data[item] - av) / std\n",
    "    log_fields_av.append(av)\n",
    "    log_fields_std.append(std)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "dfn=pd.DataFrame(columns=norm_fields)\n",
    "dfn.loc[0] = norm_fields_av\n",
    "dfn.loc[1] = norm_fields_std\n",
    "dfd=pd.DataFrame(columns=log_fields)\n",
    "dfd.loc[0] = log_fields_av\n",
    "dfd.loc[1] = log_fields_std"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# # normalise binary fields\n",
    "# disc_inp_data[binary_fields] = disc_inp_data[binary_fields] + 0.5 \n",
    "# # normal distn fields\n",
    "# for item in norm_fields:\n",
    "#     av = dfn.loc[0,item]\n",
    "#     std = dfn.loc[1,item]\n",
    "#     disc_inp_data[item] = disc_inp_data[item]*std + av\n",
    "# # log normal fields、\n",
    "# for item in log_fields:\n",
    "#     av = dfd.loc[0,item]\n",
    "#     std = dfd.loc[1,item]\n",
    "#     disc_inp_data[item] = disc_inp_data[item]*std + av\n",
    "# # 修改\n",
    "# disc_inp_data[log_fields] = np.exp(disc_inp_data[log_fields])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "# with open('df_norm.csv','wb') as f:  \n",
    "#     pickle.dump(dfn,f)\n",
    "# with open('df_log.csv','wb') as f:  \n",
    "#     pickle.dump(dfd,f)\n",
    "dfn.to_csv('df_norm.csv')\n",
    "dfd.to_csv('df_log.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "# scale features to [0,1] in train set, similar in val and test\n",
    "import copy\n",
    "scalable_fields = copy.deepcopy(binary_fields)\n",
    "scalable_fields.extend(norm_fields)\n",
    "scalable_fields.extend(log_fields)\n",
    "dmin = []\n",
    "dmax = []\n",
    "for col in scalable_fields:\n",
    "    minimum = min(disc_inp_data[col])\n",
    "    maximum = max(disc_inp_data[col])\n",
    "    disc_inp_data[col] = (disc_inp_data[col] - minimum)/(maximum-minimum)\n",
    "    dmin.append(minimum)\n",
    "    dmax.append(maximum)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "dfminmax=pd.DataFrame(columns=scalable_fields)\n",
    "dfminmax.loc[0] = dmin\n",
    "dfminmax.loc[1] = dmax\n",
    "dfminmax.to_csv('dfminmax.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# for col in scalable_fields:\n",
    "#     minimum = dfminmax.loc[0,col]\n",
    "#     maximum = dfminmax.loc[1,col]\n",
    "#     disc_inp_data[col] = disc_inp_data[col]*(maximum-minimum)+minimum"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "disc_inp_data['iv_input'] = orig_data['input_4hourly']\n",
    "disc_inp_data['vaso_input'] = orig_data['max_dose_vaso']"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Obtain expert data based on whether the patient died or not (data indicating that the patient ultimately did not die)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "expert_data = disc_inp_data[disc_inp_data['died_in_hosp']==0]\n",
    "#expert_data = disc_inp_data#"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "filtered_rows = expert_data[(expert_data['iv_input'] > 2000) | (expert_data['vaso_input'] >1)]\n",
    "\n",
    "\n",
    "unique_ids = filtered_rows['icustayid'].unique()\n",
    "\n",
    "\n",
    "df_result = expert_data[~expert_data['icustayid'].isin(unique_ids)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "16942 11859 5083\n"
     ]
    }
   ],
   "source": [
    "# now split into train/validation/test sets\n",
    "import random\n",
    "unique_ids = df_result['icustayid'].unique()\n",
    "random.shuffle(unique_ids)\n",
    "train_sample = 0.7\n",
    "test_sample = 0.3\n",
    "train_num = int(len(unique_ids) * train_sample)\n",
    "test_num = int(len(unique_ids) * (test_sample+train_sample))\n",
    "train_ids_expert = unique_ids[:train_num]\n",
    "val_ids_expert = unique_ids[train_num:]\n",
    "print(len(unique_ids),len(train_ids_expert),len(val_ids_expert))\n",
    "from pandas import DataFrame\n",
    "train_set_expert = DataFrame()\n",
    "train_set_expert = df_result.loc[df_result['icustayid'].isin(train_ids_expert)]\n",
    "\n",
    "val_set_expert = DataFrame()\n",
    "val_set_expert = df_result.loc[df_result['icustayid'].isin(val_ids_expert)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [],
   "source": [
    "#train_set_expert.to_csv('./expert_data_train.csv',index=False)\n",
    "val_set_expert.to_csv('./expert_data_val.csv',index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>bloc</th>\n",
       "      <th>icustayid</th>\n",
       "      <th>charttime</th>\n",
       "      <th>gender</th>\n",
       "      <th>age</th>\n",
       "      <th>elixhauser</th>\n",
       "      <th>re_admission</th>\n",
       "      <th>died_in_hosp</th>\n",
       "      <th>died_within_48h_of_out_time</th>\n",
       "      <th>mortality_90d</th>\n",
       "      <th>...</th>\n",
       "      <th>input_total</th>\n",
       "      <th>input_4hourly</th>\n",
       "      <th>output_total</th>\n",
       "      <th>output_4hourly</th>\n",
       "      <th>cumulated_balance</th>\n",
       "      <th>SOFA</th>\n",
       "      <th>SIRS</th>\n",
       "      <th>reward</th>\n",
       "      <th>iv_input</th>\n",
       "      <th>vaso_input</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>0.000000</td>\n",
       "      <td>12.0</td>\n",
       "      <td>5.805732e+09</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.203974</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>...</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.166667</td>\n",
       "      <td>0.50</td>\n",
       "      <td>0.583232</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>0.222560</td>\n",
       "      <td>12.0</td>\n",
       "      <td>5.805746e+09</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.203974</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>...</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.166667</td>\n",
       "      <td>0.50</td>\n",
       "      <td>0.706309</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>0.356608</td>\n",
       "      <td>12.0</td>\n",
       "      <td>5.805761e+09</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.203974</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>...</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.584931</td>\n",
       "      <td>0.736242</td>\n",
       "      <td>-650.0</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.75</td>\n",
       "      <td>0.553846</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>0.452837</td>\n",
       "      <td>12.0</td>\n",
       "      <td>5.805775e+09</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.203974</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>...</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.625773</td>\n",
       "      <td>0.722235</td>\n",
       "      <td>-1200.0</td>\n",
       "      <td>0.041667</td>\n",
       "      <td>0.50</td>\n",
       "      <td>0.546154</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>0.000000</td>\n",
       "      <td>30.0</td>\n",
       "      <td>5.707739e+09</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.492928</td>\n",
       "      <td>0.428571</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>...</td>\n",
       "      <td>9199.0</td>\n",
       "      <td>71.0</td>\n",
       "      <td>0.717290</td>\n",
       "      <td>0.697606</td>\n",
       "      <td>4459.0</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.50</td>\n",
       "      <td>0.492307</td>\n",
       "      <td>71.0</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5 rows × 62 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        bloc  icustayid     charttime  gender       age  elixhauser  \\\n",
       "19  0.000000       12.0  5.805732e+09     1.0  0.203974    0.000000   \n",
       "20  0.222560       12.0  5.805746e+09     1.0  0.203974    0.000000   \n",
       "21  0.356608       12.0  5.805761e+09     1.0  0.203974    0.000000   \n",
       "22  0.452837       12.0  5.805775e+09     1.0  0.203974    0.000000   \n",
       "34  0.000000       30.0  5.707739e+09     0.0  0.492928    0.428571   \n",
       "\n",
       "    re_admission  died_in_hosp  died_within_48h_of_out_time  mortality_90d  \\\n",
       "19           0.0           0.0                          0.0            0.0   \n",
       "20           0.0           0.0                          0.0            0.0   \n",
       "21           0.0           0.0                          0.0            0.0   \n",
       "22           0.0           0.0                          0.0            0.0   \n",
       "34           0.0           0.0                          0.0            0.0   \n",
       "\n",
       "    ...  input_total  input_4hourly  output_total  output_4hourly  \\\n",
       "19  ...          0.0            0.0      0.000000        0.000000   \n",
       "20  ...          0.0            0.0      0.000000        0.000000   \n",
       "21  ...          0.0            0.0      0.584931        0.736242   \n",
       "22  ...          0.0            0.0      0.625773        0.722235   \n",
       "34  ...       9199.0           71.0      0.717290        0.697606   \n",
       "\n",
       "    cumulated_balance      SOFA  SIRS    reward  iv_input  vaso_input  \n",
       "19                0.0  0.166667  0.50  0.583232       0.0         0.0  \n",
       "20                0.0  0.166667  0.50  0.706309       0.0         0.0  \n",
       "21             -650.0  0.000000  0.75  0.553846       0.0         0.0  \n",
       "22            -1200.0  0.041667  0.50  0.546154       0.0         0.0  \n",
       "34             4459.0  0.000000  0.50  0.492307      71.0         0.0  \n",
       "\n",
       "[5 rows x 62 columns]"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "val_set_expert.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "patient number——train dataset:test dataset:val dataset = 7:2:1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# now split into train/validation/test sets\n",
    "import random\n",
    "unique_ids = disc_inp_data['icustayid'].unique()\n",
    "random.shuffle(unique_ids)\n",
    "train_sample = 0.7\n",
    "test_sample = 0.2\n",
    "val_sample = 0.1\n",
    "train_num = int(len(unique_ids) * train_sample)\n",
    "test_num = int(len(unique_ids) * (test_sample+train_sample))\n",
    "train_ids = unique_ids[:train_num]\n",
    "test_ids = unique_ids[train_num:test_num]\n",
    "val_ids = unique_ids[test_num:]\n",
    "print(len(unique_ids),len(train_ids),len(val_ids),len(test_ids))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from pandas import DataFrame\n",
    "train_set = DataFrame()\n",
    "train_set = disc_inp_data.loc[disc_inp_data['icustayid'].isin(train_ids)]\n",
    "\n",
    "val_set = DataFrame()\n",
    "val_set = disc_inp_data.loc[disc_inp_data['icustayid'].isin(val_ids)]\n",
    "\n",
    "test_set = DataFrame()\n",
    "test_set = disc_inp_data.loc[disc_inp_data['icustayid'].isin(test_ids)]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "expert data,train data,test data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_set.to_csv('./train_data_iv1.csv',index=False)\n",
    "val_set.to_csv('./val_data_iv1.csv', index=False)\n",
    "test_set.to_csv('./test_data_iv1.csv', index=False)\n",
    "df_result.to_csv('./expert_data_iv1.csv',index=False)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "py38",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.17"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
