{
    "cells": [
        {
            "cell_type": "code",
            "execution_count": 2,
            "id": "0e16786e",
            "metadata": {},
            "outputs": [],
            "source": [
                "import os\n",
                "from pathlib import Path\n",
                "import numpy as np\n",
                "import pandas as pd\n",
                "from datetime import timedelta\n",
                "\n",
                "# p_project = Path(__file__).parents[2]\n",
                "p_project = Path(os.getcwd()).parents[1]\n",
                "path_m4 = p_project/'data/mimic4'"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 3,
            "id": "c8c64cf0",
            "metadata": {},
            "outputs": [
                {
                    "name": "stderr",
                    "output_type": "stream",
                    "text": [
                        "/tmp/ipykernel_48934/511566662.py:3: DtypeWarning: Columns (12) have mixed types. Specify dtype option on import or set low_memory=False.\n",
                        "  inputs_df = pd.read_csv(path_m4/'processed/inputs_processed.csv')[\n",
                        "/tmp/ipykernel_48934/511566662.py:7: DtypeWarning: Columns (8,11,14) have mixed types. Specify dtype option on import or set low_memory=False.\n",
                        "  presc_df = pd.read_csv(path_m4/'processed/prescriptions_processed.csv')[\n"
                    ]
                }
            ],
            "source": [
                "lab_df = pd.read_csv(path_m4/'processed/lab_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'valuenum', 'label']]\n",
                "inputs_df = pd.read_csv(path_m4/'processed/inputs_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'amount', 'label']]\n",
                "outputs_df = pd.read_csv(path_m4/'processed/outputs_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'value', 'label']]\n",
                "presc_df = pd.read_csv(path_m4/'processed/prescriptions_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'dose_val_rx', 'drug']]\n",
                "\n",
                "# Change the name of amount. Valuenum for every table\n",
                "inputs_df['valuenum'] = inputs_df['amount']\n",
                "inputs_df = inputs_df.drop(columns=['amount']).copy()\n",
                "\n",
                "outputs_df['valuenum'] = outputs_df['value']\n",
                "outputs_df = outputs_df.drop(columns=['value']).copy()\n",
                "\n",
                "presc_df['valuenum'] = presc_df['dose_val_rx']\n",
                "presc_df = presc_df.drop(columns=['dose_val_rx']).copy()\n",
                "presc_df['label'] = presc_df['drug']\n",
                "presc_df = presc_df.drop(columns=['drug']).copy()\n",
                "\n",
                "# Tag to distinguish between lab and inputs events\n",
                "inputs_df['Origin'] = 'Inputs'\n",
                "lab_df['Origin'] = 'Lab'\n",
                "outputs_df['Origin'] = 'Outputs'\n",
                "presc_df['Origin'] = 'Prescriptions'\n",
                "\n",
                "merged_df = pd.concat((inputs_df, lab_df, outputs_df, presc_df)).reset_index()\n",
                "\n",
                "# Check that all labels have different names.\n",
                "assert(merged_df['label'].nunique() == (inputs_df['label'].nunique(\n",
                ")+lab_df['label'].nunique()+outputs_df['label'].nunique()+presc_df['label'].nunique()))"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 28,
            "id": "95861979",
            "metadata": {},
            "outputs": [
                {
                    "name": "stderr",
                    "output_type": "stream",
                    "text": [
                        "/tmp/ipykernel_48934/319180892.py:44: FutureWarning: The provided callable <function max at 0x7fe8a8169870> is currently using DataFrameGroupBy.max. In a future version of pandas, the provided callable will be used directly. To keep current behavior pass the string \"max\" instead.\n",
                        "  value_df = pd.pivot_table(merged_df_short, values='valuenum', index=[\n"
                    ]
                },
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th>label_code</th>\n",
                            "      <th>ID</th>\n",
                            "      <th>Time</th>\n",
                            "      <th>Value_0</th>\n",
                            "      <th>Value_1</th>\n",
                            "      <th>Value_2</th>\n",
                            "      <th>Value_3</th>\n",
                            "      <th>Value_4</th>\n",
                            "      <th>Value_5</th>\n",
                            "      <th>Value_6</th>\n",
                            "      <th>Value_7</th>\n",
                            "      <th>...</th>\n",
                            "      <th>Mask_86</th>\n",
                            "      <th>Mask_87</th>\n",
                            "      <th>Mask_88</th>\n",
                            "      <th>Mask_89</th>\n",
                            "      <th>Mask_90</th>\n",
                            "      <th>Mask_91</th>\n",
                            "      <th>Mask_92</th>\n",
                            "      <th>Mask_93</th>\n",
                            "      <th>Mask_94</th>\n",
                            "      <th>Mask_95</th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>0</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.000000</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>1</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>578</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.000000</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>2</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>599</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.000000</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>3</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>693</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.000000</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>4</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>720</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.000000</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>...</th>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "      <td>...</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>5669787</th>\n",
                            "      <td>29999828</td>\n",
                            "      <td>2774</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>61.849996</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>5669788</th>\n",
                            "      <td>29999828</td>\n",
                            "      <td>2804</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>61.849996</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>5669789</th>\n",
                            "      <td>29999828</td>\n",
                            "      <td>2820</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.000000</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>5669790</th>\n",
                            "      <td>29999828</td>\n",
                            "      <td>2834</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>61.849996</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>5669791</th>\n",
                            "      <td>29999828</td>\n",
                            "      <td>2864</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>61.849996</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "<p>5669792 rows × 194 columns</p>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "label_code        ID  Time  Value_0  Value_1  Value_2  Value_3  Value_4  \\\n",
                            "0           20000147     0      0.0      0.0      0.0      0.0      0.0   \n",
                            "1           20000147   578      0.0      0.0      0.0      0.0      0.0   \n",
                            "2           20000147   599      0.0      0.0      0.0      0.0      0.0   \n",
                            "3           20000147   693      0.0      0.0      0.0      0.0      0.0   \n",
                            "4           20000147   720      0.0      0.0      0.0      0.0      0.0   \n",
                            "...              ...   ...      ...      ...      ...      ...      ...   \n",
                            "5669787     29999828  2774      0.0      0.0      0.0      0.0      0.0   \n",
                            "5669788     29999828  2804      0.0      0.0      0.0      0.0      0.0   \n",
                            "5669789     29999828  2820      0.0      0.0      0.0      0.0      0.0   \n",
                            "5669790     29999828  2834      0.0      0.0      0.0      0.0      0.0   \n",
                            "5669791     29999828  2864      0.0      0.0      0.0      0.0      0.0   \n",
                            "\n",
                            "label_code  Value_5    Value_6  Value_7  ...  Mask_86  Mask_87  Mask_88  \\\n",
                            "0               0.0   0.000000      0.0  ...        0        0        0   \n",
                            "1               0.0   0.000000      0.0  ...        0        0        0   \n",
                            "2               0.0   0.000000      0.0  ...        0        0        0   \n",
                            "3               0.0   0.000000      0.0  ...        0        0        0   \n",
                            "4               0.0   0.000000      0.0  ...        0        0        0   \n",
                            "...             ...        ...      ...  ...      ...      ...      ...   \n",
                            "5669787         0.0  61.849996      0.0  ...        0        0        0   \n",
                            "5669788         0.0  61.849996      0.0  ...        0        0        0   \n",
                            "5669789         0.0   0.000000      0.0  ...        0        0        0   \n",
                            "5669790         0.0  61.849996      0.0  ...        0        0        0   \n",
                            "5669791         0.0  61.849996      0.0  ...        0        0        0   \n",
                            "\n",
                            "label_code  Mask_89  Mask_90  Mask_91  Mask_92  Mask_93  Mask_94  Mask_95  \n",
                            "0                 0        0        0        0        0        0        0  \n",
                            "1                 0        0        0        0        0        0        0  \n",
                            "2                 0        0        0        0        0        0        0  \n",
                            "3                 0        0        0        0        0        0        0  \n",
                            "4                 0        0        0        0        0        0        0  \n",
                            "...             ...      ...      ...      ...      ...      ...      ...  \n",
                            "5669787           0        0        0        0        0        0        0  \n",
                            "5669788           0        0        0        0        0        0        0  \n",
                            "5669789           0        0        0        0        0        0        0  \n",
                            "5669790           0        0        0        0        0        0        0  \n",
                            "5669791           0        0        0        0        0        0        0  \n",
                            "\n",
                            "[5669792 rows x 194 columns]"
                        ]
                    },
                    "execution_count": 28,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "# set the timestamp as the time delta between the first chart time for each admission\n",
                "merged_df['charttime'] = pd.to_datetime(\n",
                "    merged_df['charttime'], format='%Y-%m-%d %H:%M:%S')\n",
                "ref_time = merged_df.groupby('hadm_id')['charttime'].min()\n",
                "merged_df_1 = pd.merge(ref_time.to_frame(name='ref_time'),\n",
                "                       merged_df, left_index=True, right_on='hadm_id')\n",
                "merged_df_1['time_stamp'] = merged_df_1['charttime']-merged_df_1['ref_time']\n",
                "assert(len(merged_df_1.loc[merged_df_1['time_stamp']\n",
                "       < timedelta(hours=0)].index) == 0)\n",
                "\n",
                "# Create a label code (int) for the labels.\n",
                "label_dict = dict(zip(list(merged_df_1['label'].unique()), range(\n",
                "    len(list(merged_df_1['label'].unique())))))\n",
                "merged_df_1['label_code'] = merged_df_1['label'].map(label_dict)\n",
                "\n",
                "label_dict_df = pd.Series(merged_df_1['label'].unique()).reset_index()\n",
                "label_dict_df.columns = ['index', 'label']\n",
                "label_dict_df['label_code'] = label_dict_df['label'].map(label_dict)\n",
                "label_dict_df.drop(columns=['index'], inplace=True)\n",
                "label_dict_df.to_csv(path_m4/'processed/variable_name_dict.csv')\n",
                "\n",
                "merged_df_short = merged_df_1[['hadm_id', 'valuenum', 'time_stamp', 'label_code']].rename(\n",
                "    columns={'hadm_id': 'ID', 'time_stamp': 'Time'})\n",
                "\n",
                "# select patients who have records in both the first 24 hours and the second 24 hours\n",
                "ids_before_24 = merged_df_short.loc[(\n",
                "    merged_df_short['Time'] < timedelta(hours=24))]['ID'].unique()\n",
                "\n",
                "ids_after_24 = merged_df_short.loc[(merged_df_short['Time'] >= timedelta(hours=24)) &\n",
                "                                   (merged_df_short['Time'] < timedelta(hours=48))]['ID'].unique()\n",
                "\n",
                "merged_df_short = merged_df_short.loc[merged_df_short['ID'].isin(\n",
                "    set(ids_before_24) & set(ids_after_24))]\n",
                "\n",
                "# select 48h records\n",
                "merged_df_short = merged_df_short.loc[merged_df_short['Time'] < timedelta(\n",
                "    hours=48)]\n",
                "\n",
                "# The sampling interval is 1 minute\n",
                "merged_df_short['Time'] = merged_df_short['Time'].dt.total_seconds().div(\n",
                "    60).astype(int)\n",
                "assert(len(merged_df_short.loc[merged_df_short['Time'] > 2880].index) == 0)\n",
                "\n",
                "value_df = pd.pivot_table(merged_df_short, values='valuenum', index=[\n",
                "                          'ID', 'Time'], columns=['label_code'], aggfunc=np.max)\n",
                "mask_df = value_df.notna()\n",
                "\n",
                "d_values = {}\n",
                "d_masks = {}\n",
                "for i in value_df.columns:\n",
                "    d_values[i] = \"Value_\" + str(i)\n",
                "    d_masks[i] = \"Mask_\" + str(i)\n",
                "\n",
                "value_df.rename(columns=d_values, inplace=True)\n",
                "mask_df.rename(columns=d_masks, inplace=True)\n",
                "\n",
                "value_df.fillna(0, inplace=True)\n",
                "mask_df = mask_df.astype(int)\n",
                "\n",
                "complete_df = pd.concat((value_df, mask_df), axis=1).reset_index()\n",
                "\n",
                "complete_df['ID'] = complete_df['ID'].astype(int)\n",
                "\n",
                "complete_df.sort_values([\"ID\", \"Time\"], inplace=True)\n",
                "\n",
                "complete_df\n"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "0190afa5",
            "metadata": {},
            "outputs": [
                {
                    "ename": "AttributeError",
                    "evalue": "module 'pandas' has no attribute 'to_csv'",
                    "output_type": "error",
                    "traceback": [
                        "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
                        "\u001b[0;31mAttributeError\u001b[0m                            Traceback (most recent call last)",
                        "\u001b[1;32m/home/hdu24/wkw/ivpvae-main/ivpvae-main/preprocess/pre_mimic4/datamerging.ipynb 单元格 4\u001b[0m line \u001b[0;36m1\n\u001b[0;32m----> <a href='vscode-notebook-cell://ssh-remote%2B10.25.10.45/home/hdu24/wkw/ivpvae-main/ivpvae-main/preprocess/pre_mimic4/datamerging.ipynb#W3sdnNjb2RlLXJlbW90ZQ%3D%3D?line=0'>1</a>\u001b[0m complete_df \u001b[39m=\u001b[39m pd\u001b[39m.\u001b[39;49mto_csv(path_m4\u001b[39m/\u001b[39m\u001b[39m'\u001b[39m\u001b[39mprocessed/mimic4_full_dataset.csv\u001b[39m\u001b[39m'\u001b[39m, index_col\u001b[39m=\u001b[39m\u001b[39m0\u001b[39m)\n",
                        "\u001b[0;31mAttributeError\u001b[0m: module 'pandas' has no attribute 'to_csv'"
                    ]
                }
            ],
            "source": [
                "complete_df = pd.read_csv(path_m4/'processed/mimic4_full_dataset.csv', index_col=0)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "e964afc9",
            "metadata": {},
            "outputs": [],
            "source": []
        },
        {
            "cell_type": "code",
            "execution_count": 5,
            "id": "7c173967",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th>label_code</th>\n",
                            "      <th>ID</th>\n",
                            "      <th>Time</th>\n",
                            "      <th>Value_0</th>\n",
                            "      <th>Value_1</th>\n",
                            "      <th>Value_2</th>\n",
                            "      <th>Value_3</th>\n",
                            "      <th>Value_4</th>\n",
                            "      <th>Value_5</th>\n",
                            "      <th>Value_6</th>\n",
                            "      <th>Value_7</th>\n",
                            "      <th>...</th>\n",
                            "      <th>Mask_86</th>\n",
                            "      <th>Mask_87</th>\n",
                            "      <th>Mask_88</th>\n",
                            "      <th>Mask_89</th>\n",
                            "      <th>Mask_90</th>\n",
                            "      <th>Mask_91</th>\n",
                            "      <th>Mask_92</th>\n",
                            "      <th>Mask_93</th>\n",
                            "      <th>Mask_94</th>\n",
                            "      <th>Mask_95</th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>0</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>1</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>578</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>2</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>599</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>3</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>693</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>4</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>720</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "<p>5 rows × 194 columns</p>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "label_code        ID  Time  Value_0  Value_1  Value_2  Value_3  Value_4  \\\n",
                            "0           20000147     0      0.0      0.0      0.0      0.0      0.0   \n",
                            "1           20000147   578      0.0      0.0      0.0      0.0      0.0   \n",
                            "2           20000147   599      0.0      0.0      0.0      0.0      0.0   \n",
                            "3           20000147   693      0.0      0.0      0.0      0.0      0.0   \n",
                            "4           20000147   720      0.0      0.0      0.0      0.0      0.0   \n",
                            "\n",
                            "label_code  Value_5  Value_6  Value_7  ...  Mask_86  Mask_87  Mask_88  \\\n",
                            "0               0.0      0.0      0.0  ...        0        0        0   \n",
                            "1               0.0      0.0      0.0  ...        0        0        0   \n",
                            "2               0.0      0.0      0.0  ...        0        0        0   \n",
                            "3               0.0      0.0      0.0  ...        0        0        0   \n",
                            "4               0.0      0.0      0.0  ...        0        0        0   \n",
                            "\n",
                            "label_code  Mask_89  Mask_90  Mask_91  Mask_92  Mask_93  Mask_94  Mask_95  \n",
                            "0                 0        0        0        0        0        0        0  \n",
                            "1                 0        0        0        0        0        0        0  \n",
                            "2                 0        0        0        0        0        0        0  \n",
                            "3                 0        0        0        0        0        0        0  \n",
                            "4                 0        0        0        0        0        0        0  \n",
                            "\n",
                            "[5 rows x 194 columns]"
                        ]
                    },
                    "execution_count": 5,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "complete_df.head()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 6,
            "id": "d7423fd5",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "(5669792, 194)"
                        ]
                    },
                    "execution_count": 6,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "complete_df.shape"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 7,
            "id": "be2bd4dc",
            "metadata": {},
            "outputs": [],
            "source": [
                "# Calculate the standard deviation of elements along the axis 0. \n",
                "# Turn elements out of 5 times of the standard deviation into 0.\n",
                "def remove_outlier(data, mask, threshold=5):\n",
                "    mean = np.mean(data, axis=0)\n",
                "    std = np.std(data, axis=0)\n",
                "    mask_outlier = abs(data - mean) > threshold * std\n",
                "    data = np.where(mask_outlier, 0, data)\n",
                "    mask = np.where(mask_outlier, 0, mask)\n",
                "    return data, mask\n",
                "\n",
                "value_cols = []\n",
                "mask_cols = []\n",
                "for col in complete_df.columns:\n",
                "    value_cols.append(col.startswith(\"Value\"))\n",
                "    mask_cols.append(col.startswith(\"Mask\"))\n",
                "\n",
                "value = complete_df.loc[:, value_cols].values\n",
                "mask = complete_df.loc[:, mask_cols].values\n",
                "value_new, mask_new = remove_outlier(value, mask)\n",
                "complete_df.loc[:, value_cols] = value_new\n",
                "complete_df.loc[:, mask_cols] = mask_new\n",
                "complete_df = complete_df.loc[complete_df.loc[:, mask_cols].sum(axis=1) > 0]"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 8,
            "id": "5d5987d3",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "(4928295, 194)"
                        ]
                    },
                    "execution_count": 8,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "complete_df.shape"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 9,
            "id": "32b45828",
            "metadata": {},
            "outputs": [],
            "source": [
                "Mask_df = complete_df.filter(regex='^(?!.*Value).*', axis=1) # Exclude columns with Value in the name"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 10,
            "id": "bd54c227",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th>label_code</th>\n",
                            "      <th>ID</th>\n",
                            "      <th>Time</th>\n",
                            "      <th>Mask_0</th>\n",
                            "      <th>Mask_1</th>\n",
                            "      <th>Mask_2</th>\n",
                            "      <th>Mask_3</th>\n",
                            "      <th>Mask_4</th>\n",
                            "      <th>Mask_5</th>\n",
                            "      <th>Mask_6</th>\n",
                            "      <th>Mask_7</th>\n",
                            "      <th>...</th>\n",
                            "      <th>Mask_86</th>\n",
                            "      <th>Mask_87</th>\n",
                            "      <th>Mask_88</th>\n",
                            "      <th>Mask_89</th>\n",
                            "      <th>Mask_90</th>\n",
                            "      <th>Mask_91</th>\n",
                            "      <th>Mask_92</th>\n",
                            "      <th>Mask_93</th>\n",
                            "      <th>Mask_94</th>\n",
                            "      <th>Mask_95</th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>1</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>578</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>2</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>599</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>3</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>693</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>4</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>720</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>5</th>\n",
                            "      <td>20000147</td>\n",
                            "      <td>742</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "<p>5 rows × 98 columns</p>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "label_code        ID  Time  Mask_0  Mask_1  Mask_2  Mask_3  Mask_4  Mask_5  \\\n",
                            "1           20000147   578       0       0       0       0       0       0   \n",
                            "2           20000147   599       0       0       0       0       0       0   \n",
                            "3           20000147   693       0       0       0       0       0       0   \n",
                            "4           20000147   720       0       0       0       0       0       0   \n",
                            "5           20000147   742       0       0       0       0       0       0   \n",
                            "\n",
                            "label_code  Mask_6  Mask_7  ...  Mask_86  Mask_87  Mask_88  Mask_89  Mask_90  \\\n",
                            "1                0       0  ...        0        0        0        0        0   \n",
                            "2                0       0  ...        0        0        0        0        0   \n",
                            "3                0       0  ...        0        0        0        0        0   \n",
                            "4                0       0  ...        0        0        0        0        0   \n",
                            "5                0       0  ...        0        0        0        0        0   \n",
                            "\n",
                            "label_code  Mask_91  Mask_92  Mask_93  Mask_94  Mask_95  \n",
                            "1                 0        0        0        0        0  \n",
                            "2                 0        0        0        0        0  \n",
                            "3                 0        0        0        0        0  \n",
                            "4                 0        0        0        0        0  \n",
                            "5                 0        0        0        0        0  \n",
                            "\n",
                            "[5 rows x 98 columns]"
                        ]
                    },
                    "execution_count": 10,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "Mask_df.head()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 11,
            "id": "5e8746aa",
            "metadata": {},
            "outputs": [],
            "source": [
                "tmp_df = Mask_df.groupby('ID').size()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 12,
            "id": "ffe5fb0d",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "<Axes: >"
                        ]
                    },
                    "execution_count": 12,
                    "metadata": {},
                    "output_type": "execute_result"
                },
                {
                    "data": {
                        "image/png": "iVBORw0KGgoAAAANSUhEUgAABk4AAAGsCAYAAACb5FtjAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjAsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvlHJYcgAAAAlwSFlzAAAPYQAAD2EBqD+naQAANpFJREFUeJzt3Xt0VeWdP+BvgCSAGlCUBMrFtFoB8YoVMrbWC5IymS6tTFe11DKidenEjkDHCzNKQdvB0lG8oXSqFWdVxmpXtRVQiKA4jKCI0qK2VFssTjVhtRaioiEm+/fH7JyfKRcJt+RsnmetLDj7fc/Juw8fzjJ+ePcuSJIkCQAAAAAAAKJTey8AAAAAAACgo1CcAAAAAAAApBQnAAAAAAAAKcUJAAAAAABASnECAAAAAACQUpwAAAAAAACkFCcAAAAAAACpLu29gL2lubk53nzzzTjooIOioKCgvZcDAAAAAAC0oyRJ4p133om+fftGp07b31eS2eLkzTffjP79+7f3MgAAAAAAgA7kjTfeiH79+m13PLPFyUEHHRQR//cGlJSUtPNqOobGxsZYtGhRjBo1KgoLC9t7ObDLZJkskWeyQpbJEnkmK2SZLJFnskKWyZJ8zHN9fX30798/1x9sT2aLk5bLc5WUlChOUo2NjdG9e/coKSnJmyDDtsgyWSLPZIUskyXyTFbIMlkiz2SFLJMl+Zznj7u9h5vDAwAAAAAApBQnAAAAAAAAKcUJAAAAAABASnECAAAAAACQUpwAAAAAAACkFCcAAAAAAAApxQkAAAAAAEBKcQIAAAAAAJBSnAAAAAAAAKQUJwAAAAAAACnFCQAAAAAAQEpxAgAAAAAAkFKcAAAAAAAApBQnAAAAAAAAKcUJAAAAAABASnECAAAAAACQ6tLeC6BjOfya+dsde/3Gqn24EgAAAAAA2PfsOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAVJuKk6lTp0ZBQUGrr0GDBuXGP/jgg6iuro5evXrFgQceGGPGjIm6urpWr7F+/fqoqqqK7t27R+/evePKK6+MDz/8sNWcp556Kk488cQoLi6OI444IubMmbPrZwgAAAAAALCT2rzj5Oijj4633nor97Vs2bLc2MSJE+PRRx+Nhx56KJYuXRpvvvlmnHvuubnxpqamqKqqii1btsQzzzwT9913X8yZMyemTJmSm7Nu3bqoqqqK008/PVavXh0TJkyIiy++OBYuXLibpwoAAAAAALBjXdr8hC5doqysbKvjmzZtinvuuSfmzp0bZ5xxRkRE3HvvvTF48OBYsWJFjBgxIhYtWhSvvPJKPPHEE1FaWhrHH3983HDDDXH11VfH1KlTo6ioKGbPnh3l5eVx0003RUTE4MGDY9myZTFz5syorKzczdMFAAAAAADYvjYXJ6+++mr07ds3unbtGhUVFTF9+vQYMGBArFq1KhobG2PkyJG5uYMGDYoBAwbE8uXLY8SIEbF8+fI45phjorS0NDensrIyLrvssnj55ZfjhBNOiOXLl7d6jZY5EyZM2OG6GhoaoqGhIfe4vr4+IiIaGxujsbGxraeZSS3vw47ej+LOycc+H9rbzmQZ8oU8kxWyTJbIM1khy2SJPJMVskyW5GOed3atbSpOhg8fHnPmzImjjjoq3nrrrZg2bVp87nOfi5deeilqa2ujqKgoevbs2eo5paWlUVtbGxERtbW1rUqTlvGWsR3Nqa+vj/fffz+6deu2zbVNnz49pk2bttXxRYsWRffu3dtymplXU1Oz3bEZJ2//eQsWLNgLq4Fdt6MsQ76RZ7JClskSeSYrZJkskWeyQpbJknzK8+bNm3dqXpuKk9GjR+d+f+yxx8bw4cNj4MCB8eCDD2630NhXJk+eHJMmTco9rq+vj/79+8eoUaOipKSkHVfWcTQ2NkZNTU2cddZZUVhYuM05Q6du/14yL011qTQ6hp3JMuQLeSYrZJkskWeyQpbJEnkmK2SZLMnHPLdcqerjtPlSXR/Vs2fP+PSnPx2vvfZanHXWWbFly5bYuHFjq10ndXV1uXuilJWVxXPPPdfqNerq6nJjLb+2HPvonJKSkh2WM8XFxVFcXLzV8cLCwrz5Q9tXdvSeNDQV7PB50JH4+02WyDNZIctkiTyTFbJMlsgzWSHLZEk+5Xln19lpd77Ju+++G7/73e+iT58+MWzYsCgsLIzFixfnxteuXRvr16+PioqKiIioqKiINWvWxIYNG3JzampqoqSkJIYMGZKb89HXaJnT8hoAAAAAAAB7S5uKk3/+53+OpUuXxuuvvx7PPPNMfOlLX4rOnTvH+eefHz169IiLLrooJk2aFE8++WSsWrUqLrzwwqioqIgRI0ZERMSoUaNiyJAhccEFF8Qvf/nLWLhwYVx77bVRXV2d2y1y6aWXxu9///u46qqr4je/+U3ceeed8eCDD8bEiRP3/NkDAAAAAAB8RJsu1fW///u/cf7558ef//znOOyww+Kzn/1srFixIg477LCIiJg5c2Z06tQpxowZEw0NDVFZWRl33nln7vmdO3eOefPmxWWXXRYVFRVxwAEHxLhx4+L666/PzSkvL4/58+fHxIkT49Zbb41+/frF3XffHZWV7q8BAAAAAADsXW0qTh544IEdjnft2jVmzZoVs2bN2u6cgQMHxoIFC3b4Oqeddlq8+OKLbVkaAAAAAADAbtute5wAAAAAAABkieIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAILVbxcmNN94YBQUFMWHChNyxDz74IKqrq6NXr15x4IEHxpgxY6Kurq7V89avXx9VVVXRvXv36N27d1x55ZXx4Ycftprz1FNPxYknnhjFxcVxxBFHxJw5c3ZnqQAAAAAAAB9rl4uTlStXxg9+8IM49thjWx2fOHFiPProo/HQQw/F0qVL480334xzzz03N97U1BRVVVWxZcuWeOaZZ+K+++6LOXPmxJQpU3Jz1q1bF1VVVXH66afH6tWrY8KECXHxxRfHwoULd3W5AAAAAAAAH2uXipN33303xo4dGz/84Q/j4IMPzh3ftGlT3HPPPXHzzTfHGWecEcOGDYt77703nnnmmVixYkVERCxatCheeeWV+PGPfxzHH398jB49Om644YaYNWtWbNmyJSIiZs+eHeXl5XHTTTfF4MGD4/LLL4+///u/j5kzZ+6BUwYAAAAAANi2LrvypOrq6qiqqoqRI0fGd77zndzxVatWRWNjY4wcOTJ3bNCgQTFgwIBYvnx5jBgxIpYvXx7HHHNMlJaW5uZUVlbGZZddFi+//HKccMIJsXz58lav0TLno5cE+2sNDQ3R0NCQe1xfXx8REY2NjdHY2Lgrp5k5Le/Djt6P4s7Jxz4f2tvOZBnyhTyTFbJMlsgzWSHLZIk8kxWyTJbkY553dq1tLk4eeOCBeOGFF2LlypVbjdXW1kZRUVH07Nmz1fHS0tKora3NzfloadIy3jK2ozn19fXx/vvvR7du3bb63tOnT49p06ZtdXzRokXRvXv3nT/B/UBNTc12x2acvP3nLViwYC+sBnbdjrIM+UaeyQpZJkvkmayQZbJEnskKWSZL8inPmzdv3ql5bSpO3njjjbjiiiuipqYmunbtuksL21smT54ckyZNyj2ur6+P/v37x6hRo6KkpKQdV9ZxNDY2Rk1NTZx11llRWFi4zTlDp27/PjIvTa3cW0uDNtmZLEO+kGeyQpbJEnkmK2SZLJFnskKWyZJ8zHPLlao+TpuKk1WrVsWGDRvixBNPzB1ramqKp59+Ou64445YuHBhbNmyJTZu3Nhq10ldXV2UlZVFRERZWVk899xzrV63rq4uN9bya8uxj84pKSnZ5m6TiIji4uIoLi7e6nhhYWHe/KHtKzt6TxqaCnb4POhI/P0mS+SZrJBlskSeyQpZJkvkmayQZbIkn/K8s+ts083hzzzzzFizZk2sXr0693XSSSfF2LFjc78vLCyMxYsX556zdu3aWL9+fVRUVEREREVFRaxZsyY2bNiQm1NTUxMlJSUxZMiQ3JyPvkbLnJbXAAAAAAAA2BvatOPkoIMOiqFDh7Y6dsABB0SvXr1yxy+66KKYNGlSHHLIIVFSUhLf/OY3o6KiIkaMGBEREaNGjYohQ4bEBRdcEDNmzIja2tq49tpro7q6Ordj5NJLL4077rgjrrrqqhg/fnwsWbIkHnzwwZg/f/6eOGcAAAAAAIBtavPN4T/OzJkzo1OnTjFmzJhoaGiIysrKuPPOO3PjnTt3jnnz5sVll10WFRUVccABB8S4cePi+uuvz80pLy+P+fPnx8SJE+PWW2+Nfv36xd133x2Vle6xAQAAAAAA7D27XZw89dRTrR537do1Zs2aFbNmzdrucwYOHBgLFizY4euedtpp8eKLL+7u8gAAAAAAAHZam+5xAgAAAAAAkGWKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAg1aW9F8C+N3TqwmhoKmjvZQAAAAAAQIdjxwkAAAAAAEBKcQIAAAAAAJBSnAAAAAAAAKQUJwAAAAAAACnFCQAAAAAAQEpxAgAAAAAAkFKcAAAAAAAApBQnAAAAAAAAKcUJAAAAAABASnECAAAAAACQUpwAAAAAAACkFCcAAAAAAAApxQkAAAAAAECqTcXJXXfdFccee2yUlJRESUlJVFRUxGOPPZYb/+CDD6K6ujp69eoVBx54YIwZMybq6upavcb69eujqqoqunfvHr17944rr7wyPvzww1ZznnrqqTjxxBOjuLg4jjjiiJgzZ86unyEAAAAAAMBOalNx0q9fv7jxxhtj1apV8fzzz8cZZ5wRZ599drz88ssRETFx4sR49NFH46GHHoqlS5fGm2++Geeee27u+U1NTVFVVRVbtmyJZ555Ju67776YM2dOTJkyJTdn3bp1UVVVFaeffnqsXr06JkyYEBdffHEsXLhwD50yAAAAAADAtnVpy+QvfvGLrR5/97vfjbvuuitWrFgR/fr1i3vuuSfmzp0bZ5xxRkRE3HvvvTF48OBYsWJFjBgxIhYtWhSvvPJKPPHEE1FaWhrHH3983HDDDXH11VfH1KlTo6ioKGbPnh3l5eVx0003RUTE4MGDY9myZTFz5syorKzcQ6cNAAAAAACwtTYVJx/V1NQUDz30ULz33ntRUVERq1atisbGxhg5cmRuzqBBg2LAgAGxfPnyGDFiRCxfvjyOOeaYKC0tzc2prKyMyy67LF5++eU44YQTYvny5a1eo2XOhAkTdriehoaGaGhoyD2ur6+PiIjGxsZobGzc1dPMlJb3obhTslvPh/bWkkWZJAvkmayQZbJEnskKWSZL5JmskGWyJB/zvLNrbXNxsmbNmqioqIgPPvggDjzwwHj44YdjyJAhsXr16igqKoqePXu2ml9aWhq1tbUREVFbW9uqNGkZbxnb0Zz6+vp4//33o1u3bttc1/Tp02PatGlbHV+0aFF07969raeZaTec1LxLz1uwYMEeXgnsnpqamvZeAuwx8kxWyDJZIs9khSyTJfJMVsgyWZJPed68efNOzWtzcXLUUUfF6tWrY9OmTfHTn/40xo0bF0uXLm3zAve0yZMnx6RJk3KP6+vro3///jFq1KgoKSlpx5V1HI2NjVFTUxPXPd8pGpoL2vz8l6a6VBodQ0uWzzrrrCgsLGzv5cBukWeyQpbJEnkmK2SZLJFnskKWyZJ8zHPLlao+TpuLk6KiojjiiCMiImLYsGGxcuXKuPXWW+MrX/lKbNmyJTZu3Nhq10ldXV2UlZVFRERZWVk899xzrV6vrq4uN9bya8uxj84pKSnZ7m6TiIji4uIoLi7e6nhhYWHe/KHtKw3NBdHQ1PbixPtIR+PvN1kiz2SFLJMl8kxWyDJZIs9khSyTJfmU551dZ6fd/UbNzc3R0NAQw4YNi8LCwli8eHFubO3atbF+/fqoqKiIiIiKiopYs2ZNbNiwITenpqYmSkpKYsiQIbk5H32NljktrwEAAAAAALC3tGnHyeTJk2P06NExYMCAeOedd2Lu3Lnx1FNPxcKFC6NHjx5x0UUXxaRJk+KQQw6JkpKS+OY3vxkVFRUxYsSIiIgYNWpUDBkyJC644IKYMWNG1NbWxrXXXhvV1dW53SKXXnpp3HHHHXHVVVfF+PHjY8mSJfHggw/G/Pnz9/zZAwAAAAAAfESbipMNGzbE17/+9XjrrbeiR48eceyxx8bChQvjrLPOioiImTNnRqdOnWLMmDHR0NAQlZWVceedd+ae37lz55g3b15cdtllUVFREQcccECMGzcurr/++tyc8vLymD9/fkycODFuvfXW6NevX9x9991RWen+GgAAAAAAwN7VpuLknnvu2eF4165dY9asWTFr1qztzhk4cGAsWLBgh69z2mmnxYsvvtiWpQEAAAAAAOy23b7HCQAAAAAAQFYoTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAIBUl/ZeAPnj8Gvmb3fs9Rur9uFKAAAAAABg77DjBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEi1qTiZPn16fOYzn4mDDjooevfuHeecc06sXbu21ZwPPvggqquro1evXnHggQfGmDFjoq6urtWc9evXR1VVVXTv3j169+4dV155ZXz44Yet5jz11FNx4oknRnFxcRxxxBExZ86cXTtDAAAAAACAndSm4mTp0qVRXV0dK1asiJqammhsbIxRo0bFe++9l5szceLEePTRR+Ohhx6KpUuXxptvvhnnnntubrypqSmqqqpiy5Yt8cwzz8R9990Xc+bMiSlTpuTmrFu3LqqqquL000+P1atXx4QJE+Liiy+OhQsX7oFTBgAAAAAA2LYubZn8+OOPt3o8Z86c6N27d6xatSpOPfXU2LRpU9xzzz0xd+7cOOOMMyIi4t57743BgwfHihUrYsSIEbFo0aJ45ZVX4oknnojS0tI4/vjj44Ybboirr746pk6dGkVFRTF79uwoLy+Pm266KSIiBg8eHMuWLYuZM2dGZWXlNtfW0NAQDQ0Nucf19fUREdHY2BiNjY1tOc3Mankfijsle/y1j/rXedsde2nqtv/MYFe1ZNnfbbJAnskKWSZL5JmskGWyRJ7JClkmS/Ixzzu71oIkSXb5/6K/9tprceSRR8aaNWti6NChsWTJkjjzzDPjL3/5S/Ts2TM3b+DAgTFhwoSYOHFiTJkyJX7xi1/E6tWrc+Pr1q2LT37yk/HCCy/ECSecEKeeemqceOKJccstt+Tm3HvvvTFhwoTYtGnTNtcyderUmDZt2lbH586dG927d9/VUwQAAAAAADJg8+bN8dWvfjU2bdoUJSUl253Xph0nH9Xc3BwTJkyIU045JYYOHRoREbW1tVFUVNSqNImIKC0tjdra2tyc0tLSrcZbxnY0p76+Pt5///3o1q3bVuuZPHlyTJo0Kfe4vr4++vfvH6NGjdrhG7A/aWxsjJqamrju+U7R0Fywz76vHSfsaS1ZPuuss6KwsLC9lwO7RZ7JClkmS+SZrJBlskSeyQpZJkvyMc8tV6r6OLtcnFRXV8dLL70Uy5Yt29WX2KOKi4ujuLh4q+OFhYV584e2rzQ0F0RD074rTrz/7C3+fpMl8kxWyDJZIs9khSyTJfJMVsgyWZJPed7Zdbbp5vAtLr/88pg3b148+eST0a9fv9zxsrKy2LJlS2zcuLHV/Lq6uigrK8vNqaur22q8ZWxHc0pKSra52wQAAAAAAGBPaFNxkiRJXH755fHwww/HkiVLory8vNX4sGHDorCwMBYvXpw7tnbt2li/fn1UVFRERERFRUWsWbMmNmzYkJtTU1MTJSUlMWTIkNycj75Gy5yW1wAAAAAAANgb2nSprurq6pg7d278/Oc/j4MOOih3T5IePXpEt27dokePHnHRRRfFpEmT4pBDDomSkpL45je/GRUVFTFixIiIiBg1alQMGTIkLrjggpgxY0bU1tbGtddeG9XV1blLbV166aVxxx13xFVXXRXjx4+PJUuWxIMPPhjz58/fw6cPAAAAAADw/7Vpx8ldd90VmzZtitNOOy369OmT+/rJT36SmzNz5sz4u7/7uxgzZkyceuqpUVZWFj/72c9y4507d4558+ZF586do6KiIr72ta/F17/+9bj++utzc8rLy2P+/PlRU1MTxx13XNx0001x9913R2Wlm4wDAAAAAAB7T5t2nCRJ8rFzunbtGrNmzYpZs2Ztd87AgQNjwYIFO3yd0047LV588cW2LA8AAAAAAGC37NLN4QEAAAAAALJIcQIAAAAAAJBSnAAAAAAAAKQUJwAAAAAAACnFCQAAAAAAQEpxAgAAAAAAkFKcAAAAAAAApBQnAAAAAAAAKcUJAAAAAABASnECAAAAAACQUpwAAAAAAACkurT3Asi+w6+Zv8Px12+s2kcrAQAAAACAHbPjBAAAAAAAIKU4AQAAAAAASClOAAAAAAAAUooTAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAINWlvRcAh18zf7tjr99YtQ9XAgAAAADA/s6OEwAAAAAAgJTiBAAAAAAAIOVSXXRoO7qM1464xBcAAAAAALvCjhMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgFSX9l4A7A2HXzN/u2Ov31i1D1cCAAAAAEA+seMEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICUm8PDR7ipPAAAAADA/s2OEwAAAAAAgJTiBAAAAAAAIOVSXex3dnQ5LgAAAAAA9m92nAAAAAAAAKQUJwAAAAAAACnFCQAAAAAAQEpxAgAAAAAAkFKcAAAAAAAApBQnAAAAAAAAKcUJAAAAAABASnECAAAAAACQ6tLeC4B8cfg187c79vqNVftwJQAAAAAA7C12nAAAAAAAAKQUJwAAAAAAACnFCQAAAAAAQEpxAgAAAAAAkFKcAAAAAAAApNpcnDz99NPxxS9+Mfr27RsFBQXxyCOPtBpPkiSmTJkSffr0iW7dusXIkSPj1VdfbTXn7bffjrFjx0ZJSUn07NkzLrroonj33XdbzfnVr34Vn/vc56Jr167Rv3//mDFjRtvPDgAAAAAAoA26tPUJ7733Xhx33HExfvz4OPfcc7canzFjRtx2221x3333RXl5eVx33XVRWVkZr7zySnTt2jUiIsaOHRtvvfVW1NTURGNjY1x44YVxySWXxNy5cyMior6+PkaNGhUjR46M2bNnx5o1a2L8+PHRs2fPuOSSS3bzlGHPO/ya+dsde/3Gqn24EgAAAAAAdkebi5PRo0fH6NGjtzmWJEnccsstce2118bZZ58dERH/+Z//GaWlpfHII4/EeeedF7/+9a/j8ccfj5UrV8ZJJ50UERG33357/O3f/m38+7//e/Tt2zfuv//+2LJlS/zoRz+KoqKiOProo2P16tVx8803K04AAAAAAIC9ps3FyY6sW7cuamtrY+TIkbljPXr0iOHDh8fy5cvjvPPOi+XLl0fPnj1zpUlExMiRI6NTp07x7LPPxpe+9KVYvnx5nHrqqVFUVJSbU1lZGd/73vfiL3/5Sxx88MFbfe+GhoZoaGjIPa6vr4+IiMbGxmhsbNyTp5m3Wt6H4k5JO69k/yJ/e17Le+q9JQvkmayQZbJEnskKWSZL5JmskGWyJB/zvLNr3aPFSW1tbURElJaWtjpeWlqaG6utrY3evXu3XkSXLnHIIYe0mlNeXr7Va7SMbas4mT59ekybNm2r44sWLYru3bvv4hll0w0nNbf3EvYrCxYsaO8lZFZNTU17LwH2GHkmK2SZLJFnskKWyRJ5JitkmSzJpzxv3rx5p+bt0eKkPU2ePDkmTZqUe1xfXx/9+/ePUaNGRUlJSTuurONobGyMmpqauO75TtHQXNDey9lvvDS1sr2XkDktWT7rrLOisLCwvZcDu0WeyQpZJkvkmayQZbJEnskKWSZL8jHPLVeq+jh7tDgpKyuLiIi6urro06dP7nhdXV0cf/zxuTkbNmxo9bwPP/ww3n777dzzy8rKoq6urtWclsctc/5acXFxFBcXb3W8sLAwb/7Q9pWG5oJoaFKc7Cvyt/f4+02WyDNZIctkiTyTFbJMlsgzWSHLZEk+5Xln19lpT37T8vLyKCsri8WLF+eO1dfXx7PPPhsVFRUREVFRUREbN26MVatW5eYsWbIkmpubY/jw4bk5Tz/9dKvrjdXU1MRRRx21zct0AQAAAAAA7Alt3nHy7rvvxmuvvZZ7vG7duli9enUccsghMWDAgJgwYUJ85zvfiSOPPDLKy8vjuuuui759+8Y555wTERGDBw+OL3zhC/GNb3wjZs+eHY2NjXH55ZfHeeedF3379o2IiK9+9asxbdq0uOiii+Lqq6+Ol156KW699daYOXPmnjlr6CAOv2b+dsdev7FqH64EAAAAAICIXShOnn/++Tj99NNzj1vuKzJu3LiYM2dOXHXVVfHee+/FJZdcEhs3bozPfvaz8fjjj0fXrl1zz7n//vvj8ssvjzPPPDM6deoUY8aMidtuuy033qNHj1i0aFFUV1fHsGHD4tBDD40pU6bEJZdcsjvnCgAAAAAAsENtLk5OO+20SJJku+MFBQVx/fXXx/XXX7/dOYccckjMnTt3h9/n2GOPjf/+7/9u6/IAAAAAAAB22R69xwkAAAAAAEA+a/OOE2DfcP8TAAAAAIB9z44TAAAAAACAlOIEAAAAAAAg5VJdkIdcxgsAAAAAYO+w4wQAAAAAACBlxwlkjN0oAAAAAAC7zo4TAAAAAACAlOIEAAAAAAAg5VJdQETs+BJfO7Krl/9ySTEAAAAAoCOy4wQAAAAAACBlxwmwW+wcAQAAAACyRHEC+5FdvRzX/k45BAAAAAD7D5fqAgAAAAAASNlxAnvZ/rzLo6Odu50jAAAAAMDHUZwAeeXwa+ZHceckZpwcMXTqwmhoKsiNKT8AAAAAgN3lUl0AAAAAAAApO04AdsOuXv7LZcMAAAAAoGNSnAAdTnvcG2VvfM+Odo8XAAAAAODjuVQXAAAAAABASnECAAAAAACQcqkugA5mb1ziy31TAAAAAGDnKE4A9gNuRg8AAAAAO8elugAAAAAAAFJ2nACwXXaqAAAAALC/UZwA7Of2xj1VAAAAACBfuVQXAAAAAABAyo4TAPY4l/gCAAAAIF8pToDMcMkpAAAAAGB3uVQXAAAAAABASnECAAAAAACQcqkuAPYp9z8BAAAAoCOz4wQAAAAAACBlxwkAHcaOdqPsiJ0qAAAAAOwpdpwAAAAAAACk7DgBYJfs6u4QAAAAAOjIFCcA5D03nAcAAABgT1GcAJBpShUAAAAA2kJxAsB+S6kCAAAAwF9TnABAG33c/V2ULgAAAAD5S3ECANvwceUIAAAAANmkOAGADsKlwwAAAADan+IEAPawtuxWKe6cxIyTI4ZOXRgRBXtvUQAAAADslE7tvQAAAAAAAICOwo4TANhPuTQYAAAAwNYUJwCQB3a15NgbN7lXuAAAAABZpjgBALayNwoXAAAAgHygOAEA9phdLVzsVAEAAAA6CsUJANChuTQYAAAAsC8pTgAgz+3Pl9WywwUAAADY0xQnAEC725/LHwAAAKBjUZwAAPudvXH5L5cUAwAAgGxQnAAAfERHKlU+bieOQgYAAAD2PMUJAEA7cpkyAAAA6FgUJwAAeaojlS6v3jCqvZcAAAAAe4TiBABgJ3WkoqKjGTp1Ycw4+f9+bWgqaDW2q5cj2xuXInMvGgAAAD6O4gQAgL1qVwunfV1U7Y3vt6/viwMAAMDuU5wAAMBesjcKkI5U8AAAAGRRhy5OZs2aFd///vejtrY2jjvuuLj99tvj5JNPbu9lAQDAbutIl37rSGv5OB3p0m8AAEA2ddji5Cc/+UlMmjQpZs+eHcOHD49bbrklKisrY+3atdG7d+/2Xh4AANAO9sWl34o7J9u9Z8+esK/v37Mj7iUEAABb67DFyc033xzf+MY34sILL4yIiNmzZ8f8+fPjRz/6UVxzzTVbzW9oaIiGhobc402bNkVExNtvvx2NjY37ZtEdXGNjY2zevDm6NHaKpuY9/wMg7CtdmpPYvLlZlskEeSYrZJks2dt5PuKfH9zjr7mrP9jt67Xsje/3cZ6dfOYef83h0xfv0vfb189r+Rnwz3/+cxQWFm533p6yq+uEnbGv8wx7iyyTJfmY53feeSciIpIk2eG8guTjZrSDLVu2RPfu3eOnP/1pnHPOObnj48aNi40bN8bPf/7zrZ4zderUmDZt2j5cJQAAAAAAkG/eeOON6Nev33bHO+SOkz/96U/R1NQUpaWlrY6XlpbGb37zm20+Z/LkyTFp0qTc4+bm5nj77bejV69eUVDgXz1GRNTX10f//v3jjTfeiJKSkvZeDuwyWSZL5JmskGWyRJ7JClkmS+SZrJBlsiQf85wkSbzzzjvRt2/fHc7rkMXJriguLo7i4uJWx3r27Nk+i+ngSkpK8ibIsCOyTJbIM1khy2SJPJMVskyWyDNZIctkSb7luUePHh87p9M+WEebHXroodG5c+eoq6trdbyuri7KysraaVUAAAAAAEDWdcjipKioKIYNGxaLF///G8s1NzfH4sWLo6Kioh1XBgAAAAAAZFmHvVTXpEmTYty4cXHSSSfFySefHLfccku89957ceGFF7b30vJWcXFxfPvb397qkmaQb2SZLJFnskKWyRJ5JitkmSyRZ7JClsmSLOe5IEmSpL0XsT133HFHfP/734/a2to4/vjj47bbbovhw4e397IAAAAAAICM6tDFCQAAAAAAwL7UIe9xAgAAAAAA0B4UJwAAAAAAACnFCQAAAAAAQEpxAgAAAAAAkFKc7CdmzZoVhx9+eHTt2jWGDx8ezz33XHsvCVp5+umn44tf/GL07ds3CgoK4pFHHmk1niRJTJkyJfr06RPdunWLkSNHxquvvtpqzttvvx1jx46NkpKS6NmzZ1x00UXx7rvv7sOzgIjp06fHZz7zmTjooIOid+/ecc4558TatWtbzfnggw+iuro6evXqFQceeGCMGTMm6urqWs1Zv359VFVVRffu3aN3795x5ZVXxocffrgvTwXirrvuimOPPTZKSkqipKQkKioq4rHHHsuNyzL56sYbb4yCgoKYMGFC7pg8ky+mTp0aBQUFrb4GDRqUG5dl8skf//jH+NrXvha9evWKbt26xTHHHBPPP/98btzPgeSLww8/fKvP5oKCgqiuro4In83kj6amprjuuuuivLw8unXrFp/61KfihhtuiCRJcnP2l89mxcl+4Cc/+UlMmjQpvv3tb8cLL7wQxx13XFRWVsaGDRvae2mQ895778Vxxx0Xs2bN2ub4jBkz4rbbbovZs2fHs88+GwcccEBUVlbGBx98kJszduzYePnll6OmpibmzZsXTz/9dFxyySX76hQgIiKWLl0a1dXVsWLFiqipqYnGxsYYNWpUvPfee7k5EydOjEcffTQeeuihWLp0abz55ptx7rnn5sabmpqiqqoqtmzZEs8880zcd999MWfOnJgyZUp7nBL7sX79+sWNN94Yq1atiueffz7OOOOMOPvss+Pll1+OCFkmP61cuTJ+8IMfxLHHHtvquDyTT44++uh46623cl/Lli3Ljcky+eIvf/lLnHLKKVFYWBiPPfZYvPLKK3HTTTfFwQcfnJvj50DyxcqVK1t9LtfU1ERExJe//OWI8NlM/vje974Xd911V9xxxx3x61//Or73ve/FjBkz4vbbb8/N2W8+mxMy7+STT06qq6tzj5uampK+ffsm06dPb8dVwfZFRPLwww/nHjc3NydlZWXJ97///dyxjRs3JsXFxcl//dd/JUmSJK+88koSEcnKlStzcx577LGkoKAg+eMf/7jP1g5/bcOGDUlEJEuXLk2S5P+yW1hYmDz00EO5Ob/+9a+TiEiWL1+eJEmSLFiwIOnUqVNSW1ubm3PXXXclJSUlSUNDw749AfgrBx98cHL33XfLMnnpnXfeSY488sikpqYm+fznP59cccUVSZL4bCa/fPvb306OO+64bY7JMvnk6quvTj772c9ud9zPgeSzK664IvnUpz6VNDc3+2wmr1RVVSXjx49vdezcc89Nxo4dmyTJ/vXZbMdJxm3ZsiVWrVoVI0eOzB3r1KlTjBw5MpYvX96OK4Odt27duqitrW2V4x49esTw4cNzOV6+fHn07NkzTjrppNyckSNHRqdOneLZZ5/d52uGFps2bYqIiEMOOSQiIlatWhWNjY2t8jxo0KAYMGBAqzwfc8wxUVpamptTWVkZ9fX1uX/pD/taU1NTPPDAA/Hee+9FRUWFLJOXqquro6qqqlVuI3w2k39effXV6Nu3b3zyk5+MsWPHxvr16yNClskvv/jFL+Kkk06KL3/5y9G7d+844YQT4oc//GFu3M+B5KstW7bEj3/84xg/fnwUFBT4bCav/M3f/E0sXrw4fvvb30ZExC9/+ctYtmxZjB49OiL2r8/mLu29APauP/3pT9HU1NTqgzciorS0NH7zm9+006qgbWprayMitpnjlrHa2tro3bt3q/EuXbrEIYcckpsD+1pzc3NMmDAhTjnllBg6dGhE/F9Wi4qKomfPnq3m/nWet5X3ljHYl9asWRMVFRXxwQcfxIEHHhgPP/xwDBkyJFavXi3L5JUHHnggXnjhhVi5cuVWYz6bySfDhw+POXPmxFFHHRVvvfVWTJs2LT73uc/FSy+9JMvkld///vdx1113xaRJk+Jf/uVfYuXKlfFP//RPUVRUFOPGjfNzIHnrkUceiY0bN8Y//MM/RIT/ziC/XHPNNVFfXx+DBg2Kzp07R1NTU3z3u9+NsWPHRsT+9f/oFCcAsJdUV1fHSy+91Oq645BvjjrqqFi9enVs2rQpfvrTn8a4ceNi6dKl7b0saJM33ngjrrjiiqipqYmuXbu293Jgt7T8i8+IiGOPPTaGDx8eAwcOjAcffDC6devWjiuDtmlubo6TTjop/u3f/i0iIk444YR46aWXYvbs2TFu3Lh2Xh3sunvuuSdGjx4dffv2be+lQJs9+OCDcf/998fcuXPj6KOPjtWrV8eECROib9+++91ns0t1Zdyhhx4anTt3jrq6ulbH6+rqoqysrJ1WBW3TktUd5bisrCw2bNjQavzDDz+Mt99+W9ZpF5dffnnMmzcvnnzyyejXr1/ueFlZWWzZsiU2btzYav5f53lbeW8Zg32pqKgojjjiiBg2bFhMnz49jjvuuLj11ltlmbyyatWq2LBhQ5x44onRpUuX6NKlSyxdujRuu+226NKlS5SWlsozeatnz57x6U9/Ol577TWfzeSVPn36xJAhQ1odGzx4cO7Sc34OJB/94Q9/iCeeeCIuvvji3DGfzeSTK6+8Mq655po477zz4phjjokLLrggJk6cGNOnT4+I/euzWXGScUVFRTFs2LBYvHhx7lhzc3MsXrw4Kioq2nFlsPPKy8ujrKysVY7r6+vj2WefzeW4oqIiNm7cGKtWrcrNWbJkSTQ3N8fw4cP3+ZrZfyVJEpdffnk8/PDDsWTJkigvL281PmzYsCgsLGyV57Vr18b69etb5XnNmjWt/kOjpqYmSkpKtvrhEva15ubmaGhokGXyyplnnhlr1qyJ1atX575OOumkGDt2bO738ky+evfdd+N3v/td9OnTx2czeeWUU06JtWvXtjr229/+NgYOHBgRfg4kP917773Ru3fvqKqqyh3z2Uw+2bx5c3Tq1Loy6Ny5czQ3N0fEfvbZ3N53p2fve+CBB5Li4uJkzpw5ySuvvJJccsklSc+ePZPa2tr2XhrkvPPOO8mLL76YvPjii0lEJDfffHPy4osvJn/4wx+SJEmSG2+8MenZs2fy85//PPnVr36VnH322Ul5eXny/vvv517jC1/4QnLCCSckzz77bLJs2bLkyCOPTM4///z2OiX2U5dddlnSo0eP5Kmnnkreeuut3NfmzZtzcy699NJkwIAByZIlS5Lnn38+qaioSCoqKnLjH374YTJ06NBk1KhRyerVq5PHH388Oeyww5LJkye3xymxH7vmmmuSpUuXJuvWrUt+9atfJddcc01SUFCQLFq0KEkSWSa/ff7zn0+uuOKK3GN5Jl9861vfSp566qlk3bp1yf/8z/8kI0eOTA499NBkw4YNSZLIMvnjueeeS7p06ZJ897vfTV599dXk/vvvT7p37578+Mc/zs3xcyD5pKmpKRkwYEBy9dVXbzXms5l8MW7cuOQTn/hEMm/evGTdunXJz372s+TQQw9Nrrrqqtyc/eWzWXGyn7j99tuTAQMGJEVFRcnJJ5+crFixor2XBK08+eSTSURs9TVu3LgkSZKkubk5ue6665LS0tKkuLg4OfPMM5O1a9e2eo0///nPyfnnn58ceOCBSUlJSXLhhRcm77zzTjucDfuzbeU4IpJ77703N+f9999P/vEf/zE5+OCDk+7duydf+tKXkrfeeqvV67z++uvJ6NGjk27duiWHHnpo8q1vfStpbGzcx2fD/m78+PHJwIEDk6KiouSwww5LzjzzzFxpkiSyTH776+JEnskXX/nKV5I+ffokRUVFySc+8YnkK1/5SvLaa6/lxmWZfPLoo48mQ4cOTYqLi5NBgwYl//Ef/9Fq3M+B5JOFCxcmEbFVRpPEZzP5o76+PrniiiuSAQMGJF27dk0++clPJv/6r/+aNDQ05ObsL5/NBUmSJO2y1QUAAAAAAKCDcY8TAAAAAACAlOIEAAAAAAAgpTgBAAAAAABIKU4AAAAAAABSihMAAAAAAICU4gQAAAAAACClOAEAAAAAAEgpTgAAAAAAAFKKEwAAAAAAgJTiBAAAAAAAIKU4AQAAAAAASP0/Q0iYS/ztP/oAAAAASUVORK5CYII=",
                        "text/plain": [
                            "<Figure size 2000x500 with 1 Axes>"
                        ]
                    },
                    "metadata": {},
                    "output_type": "display_data"
                }
            ],
            "source": [
                "# Plot the distribution of the number of records for each patient\n",
                "tmp_df.hist(bins=200, figsize=(20, 5))"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 13,
            "id": "7052d2af",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "count    54442.000000\n",
                            "mean        90.523768\n",
                            "std         93.922978\n",
                            "min          1.000000\n",
                            "25%         17.000000\n",
                            "50%         59.000000\n",
                            "75%        135.000000\n",
                            "max        786.000000\n",
                            "dtype: float64"
                        ]
                    },
                    "execution_count": 13,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "tmp_df.describe()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 14,
            "metadata": {},
            "outputs": [],
            "source": [
                "ids_before = Mask_df.loc[Mask_df['Time'] < 1440].groupby('ID').size()\n",
                "ids_after = Mask_df.loc[Mask_df['Time'] > 1440].groupby('ID').size()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 15,
            "id": "fa316b18",
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "ids_before_selected:  (31803,)\n",
                        "ids_after_selected:  (27319,)\n"
                    ]
                }
            ],
            "source": [
                "ids_before_selected = ids_before.loc[ids_before >= 20].index\n",
                "ids_after_selected = ids_after.loc[ids_after >= 20].index\n",
                "\n",
                "print(\"ids_before_selected: \", ids_before_selected.shape)\n",
                "print(\"ids_after_selected: \", ids_after_selected.shape)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "metadata": {},
            "outputs": [],
            "source": []
        },
        {
            "cell_type": "code",
            "execution_count": 23,
            "metadata": {},
            "outputs": [],
            "source": [
                "# df_var_num = Mask_df.iloc[:, 1:].groupby(\"ID\").apply(lambda x: x.sum(axis=0).gt(0).sum())\n",
                "\n",
                "feature_cols = [col for col in Mask_df.columns if col != \"ID\"]\n",
                "df_var_num = Mask_df.groupby(\"ID\")[feature_cols].apply(\n",
                "    lambda x: x.sum(axis=0).gt(0).sum()\n",
                ")"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 24,
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "<Axes: >"
                        ]
                    },
                    "execution_count": 24,
                    "metadata": {},
                    "output_type": "execute_result"
                },
                {
                    "data": {
                        "image/png": "iVBORw0KGgoAAAANSUhEUgAAAjYAAAGdCAYAAAABhTmFAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjAsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvlHJYcgAAAAlwSFlzAAAPYQAAD2EBqD+naQAAKdVJREFUeJzt3X9w1PWdx/HXJiQLATbhh8mSI4RYT34KnCBhx8qBhASaeqLMnBQqHKUycolTTA8lNwoBqiBWVCwVO1bDzZGC3hRbgQILlFAkgKTkELAZ8cDYg4Q7abKQSFjI9/7w8i2bLJCETTZ88nzM7Mh+v+/P9/vZ935ZXn73u7sOy7IsAQAAGCAi3BMAAAAIFYINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYncI9gdZSV1enM2fOqHv37nI4HOGeDgAAaALLsnThwgUlJiYqIqL551+MDTZnzpxRUlJSuKcBAABa4Msvv1Tfvn2bPc7YYNO9e3dJ3zTG5XI1aYzf79eOHTuUnp6uqKio1pwegqD/4UX/w4v+hxf9D5+Gvff5fEpKSrL/HW8uY4NN/dtPLperWcEmJiZGLpeLAzsM6H940f/wov/hRf/D53q9b+llJFw8DAAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGCMTuGeAIDbQ/+FWwLun16RGaaZAMD1EWwAqP/CLXJGWlo5Whqat12lL3y3Vfd1LQISgFDirSgAAGAMgg0AADAGwQYAABiDYAMAAIzBxcOA4bhYF0BHwhkbAABgDM7YAGh3OMsEoKU4YwMAAIxBsAEAAMYg2AAAAGMQbAAAgDG4eBhAyHDRL4Bw44wNAAAwBsEGAAAYg2ADAACMwTU2AIzQ8PoeiWt8gI6IMzYAAMAYzQo2y5cv13333afu3bsrPj5eU6ZMUWlpaUDNuHHj5HA4Am5PPvlkQE1ZWZkyMzMVExOj+Ph4LViwQFeuXAmo2bNnj+699145nU7dddddys/Pb9kjBAAAHUazgk1hYaGysrJ04MABeb1e+f1+paenq7q6OqDuiSee0NmzZ+3bypUr7XVXr15VZmamLl++rP3792vdunXKz8/XokWL7JpTp04pMzNT48ePV0lJiebPn68f/vCH2r59+y0+XAAAYLJmXWOzbdu2gPv5+fmKj49XcXGxxo4day+PiYmR2+0Ouo0dO3boxIkT2rlzpxISEjRixAgtW7ZMzz77rPLy8hQdHa21a9cqJSVFr7zyiiRp0KBB2rdvn1599VVlZGQ09zECAIAO4pausamqqpIk9ezZM2D5+vXr1bt3bw0dOlS5ubmqqamx1xUVFemee+5RQkKCvSwjI0M+n0/Hjx+3a9LS0gK2mZGRoaKioluZLgAAMFyLPxVVV1en+fPn6/7779fQoUPt5dOnT1dycrISExN19OhRPfvssyotLdWvf/1rSVJ5eXlAqJFk3y8vL79hjc/n09dff60uXbo0mk9tba1qa2vt+z6fT5Lk9/vl9/ub9Jjq65paj9Ci/63DGWkF3A/WX2ekJWfEN3XOCOu6NU3ZTlvV3GxMU8e1Fxz/4UX/w6dh72/1OXBYltX41aAJ5s2bp9/97nfat2+f+vbte9263bt3a8KECTp58qS+9a1vae7cufriiy8CrpepqalR165dtXXrVk2ePFl33323Zs+erdzcXLtm69atyszMVE1NTdBgk5eXpyVLljRaXlBQoJiYmJY8RAAA0MZqamo0ffp0VVVVyeVyNXt8i87YZGdna/Pmzdq7d+8NQ40kpaamSpIdbNxutw4dOhRQU1FRIUn2dTlut9tedm2Ny+UKGmokKTc3Vzk5OfZ9n8+npKQkpaenN7kxfr9fXq9XEydOVFRUVJPGIHTof+sYmhd40f2xvMbXqQ3N2y5nhKVlo+r0/OEIFS+a1OLttFXNzcY0dVx7wfEfXvQ/fBr2vv4dl5ZqVrCxLEtPPfWUNm3apD179iglJeWmY0pKSiRJffr0kSR5PB698MILOnfunOLj4yVJXq9XLpdLgwcPtmu2bt0asB2v1yuPx3Pd/TidTjmdzkbLo6Kimn2QtmQMQof+N11TfnSy9qoj4H6w3l5bU1vnuGlNU7bT2jU3G9PUce0Nx3940f/wqe/9rfa/WRcPZ2Vl6d///d9VUFCg7t27q7y8XOXl5fr6668lSZ9//rmWLVum4uJinT59Wr/97W81c+ZMjR07VsOGDZMkpaena/DgwXr88cf1n//5n9q+fbuee+45ZWVl2cHkySef1H/913/pmWee0Z/+9Cf9/Oc/13vvvaenn376lh4sAAAwW7OCzZtvvqmqqiqNGzdOffr0sW8bN26UJEVHR2vnzp1KT0/XwIED9eMf/1hTp07Vhx9+aG8jMjJSmzdvVmRkpDwej77//e9r5syZWrp0qV2TkpKiLVu2yOv1avjw4XrllVf09ttv81FvAABwQ81+K+pGkpKSVFhYeNPtJCcnN3qrqaFx48bpyJEjzZkeANwQvycFmI/figIAAMYg2AAAAGMQbAAAgDEINgAAwBgt/kkFAK2rKd9RAwAIxBkbAABgDM7YAEAz8bFxoP3ijA0AADAGwQYAABiDYAMAAIxBsAEAAMYg2AAAAGPwqSgAuEaoPvHEJ6eA8OCMDQAAMAbBBgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMYg2AAAAGMQbAAAgDEINgAAwBidwj0BAOio+i/cYv/ZGWlp5egwTgYwBMEGaGXX/uNV7/SKzDDMBADMx1tRAADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMYg2AAAAGMQbAAAgDEINgAAwBjNCjbLly/Xfffdp+7duys+Pl5TpkxRaWlpQM2lS5eUlZWlXr16qVu3bpo6daoqKioCasrKypSZmamYmBjFx8drwYIFunLlSkDNnj17dO+998rpdOquu+5Sfn5+yx4hANzG+i/c0ugG4PqaFWwKCwuVlZWlAwcOyOv1yu/3Kz09XdXV1XbN008/rQ8//FDvv/++CgsLdebMGT366KP2+qtXryozM1OXL1/W/v37tW7dOuXn52vRokV2zalTp5SZmanx48erpKRE8+fP1w9/+ENt3749BA8ZAACYqlNzirdt2xZwPz8/X/Hx8SouLtbYsWNVVVWlX/7ylyooKNCDDz4oSXr33Xc1aNAgHThwQGPGjNGOHTt04sQJ7dy5UwkJCRoxYoSWLVumZ599Vnl5eYqOjtbatWuVkpKiV155RZI0aNAg7du3T6+++qoyMjJC9NABAIBpmhVsGqqqqpIk9ezZU5JUXFwsv9+vtLQ0u2bgwIHq16+fioqKNGbMGBUVFemee+5RQkKCXZORkaF58+bp+PHj+ru/+zsVFRUFbKO+Zv78+dedS21trWpra+37Pp9PkuT3++X3+5v0eOrrmlqP0DK1/85Iq9GypjzGhuOCjQlljTPimzpnhNXq+wpFzc3GBBvXnmvq+9+S7eDWmfr6czto2PtbfQ4clmU1/lvTBHV1dfqHf/gHVVZWat++fZKkgoICzZ49OyBgSNLo0aM1fvx4vfTSS5o7d66++OKLgLeVampq1LVrV23dulWTJ0/W3XffrdmzZys3N9eu2bp1qzIzM1VTU6MuXbo0mk9eXp6WLFnSaHlBQYFiYmJa8hABAEAbq6mp0fTp01VVVSWXy9Xs8S0+Y5OVlaVjx47ZoSbccnNzlZOTY9/3+XxKSkpSenp6kxvj9/vl9Xo1ceJERUVFtdZUcR2m9n9oXuNrw47l3fwt1Ybjgo0JZY0zwtKyUXV6/nCEihdNCvt8blZzszHBxrXnmvr+Nzz+W3r8oHlMff25HTTsff07Li3VomCTnZ2tzZs3a+/everbt6+93O126/Lly6qsrFRcXJy9vKKiQm632645dOhQwPbqPzV1bU3DT1JVVFTI5XIFPVsjSU6nU06ns9HyqKioZh+kLRmD0DGt/7VXHY2WNeXxNRwXbExr1NTWOdpsX7dSc7MxwcbdLjXX1rX0+EHLmPb6czup7/2t9r9Zn4qyLEvZ2dnatGmTdu/erZSUlID1I0eOVFRUlHbt2mUvKy0tVVlZmTwejyTJ4/Hok08+0blz5+war9crl8ulwYMH2zXXbqO+pn4bAAAAwTTrjE1WVpYKCgr0m9/8Rt27d1d5ebkkKTY2Vl26dFFsbKzmzJmjnJwc9ezZUy6XS0899ZQ8Ho/GjBkjSUpPT9fgwYP1+OOPa+XKlSovL9dzzz2nrKws+4zLk08+qZ/97Gd65pln9IMf/EC7d+/We++9py1b+P4GAABwfc06Y/Pmm2+qqqpK48aNU58+fezbxo0b7ZpXX31V3/3udzV16lSNHTtWbrdbv/71r+31kZGR2rx5syIjI+XxePT9739fM2fO1NKlS+2alJQUbdmyRV6vV8OHD9crr7yit99+m496AwCAG2rWGZumfICqc+fOWrNmjdasWXPdmuTkZG3duvWG2xk3bpyOHDnSnOkBAIAOjt+KAgAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABijU7gnANzO+i/c0mjZ6RWZYZgJAEDijA0AADAIwQYAABiDYAMAAIxBsAEAAMYg2AAAAGMQbAAAgDEINgAAwBgEGwAAYAyCDQAAMAbBBgAAGIOfVACA2xw/7QH8FWdsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMYg2AAAAGMQbAAAgDEINgAAwBgEGwAAYAyCDQAAMAbBBgAAGINgAwAAjEGwAQAAxugU7gkAAMKj/8ItjZadXpEZhpkAocMZGwAAYAyCDQAAMAbBBgAAGINgAwAAjNHsYLN371499NBDSkxMlMPh0AcffBCw/p/+6Z/kcDgCbpMmTQqoOX/+vGbMmCGXy6W4uDjNmTNHFy9eDKg5evSoHnjgAXXu3FlJSUlauXJl8x8dAADoUJodbKqrqzV8+HCtWbPmujWTJk3S2bNn7duvfvWrgPUzZszQ8ePH5fV6tXnzZu3du1dz58611/t8PqWnpys5OVnFxcV6+eWXlZeXp1/84hfNnS4AAOhAmv1x78mTJ2vy5Mk3rHE6nXK73UHXffrpp9q2bZs+/vhjjRo1SpL0xhtv6Dvf+Y5++tOfKjExUevXr9fly5f1zjvvKDo6WkOGDFFJSYlWrVoVEIAAAACu1SrfY7Nnzx7Fx8erR48eevDBB/WTn/xEvXr1kiQVFRUpLi7ODjWSlJaWpoiICB08eFCPPPKIioqKNHbsWEVHR9s1GRkZeumll/SXv/xFPXr0aLTP2tpa1dbW2vd9Pp8kye/3y+/3N2ne9XVNrUdo3Y79d0ZajZY1nH9Tapqy7WBjQlnjjPimzhlhtfq+QlFzszHBxrXnmvr+t9a+gmnpOBPdjq8/pmjY+1t9DhyWZTU+sps62OHQpk2bNGXKFHvZhg0bFBMTo5SUFH3++ef613/9V3Xr1k1FRUWKjIzUiy++qHXr1qm0tDRgW/Hx8VqyZInmzZun9PR0paSk6K233rLXnzhxQkOGDNGJEyc0aNCgRnPJy8vTkiVLGi0vKChQTExMSx8iAABoQzU1NZo+fbqqqqrkcrmaPT7kZ2ymTZtm//mee+7RsGHD9K1vfUt79uzRhAkTQr07W25urnJycuz7Pp9PSUlJSk9Pb3Jj/H6/vF6vJk6cqKioqNaaKq7jduz/0LztjZYdy8todk1Tth1sTChrnBGWlo2q0/OHI1S8aFLQmracz81qbjYm2Lj2XFPf/4bHf1seY00dZ6Lb8fXHFA17X/+OS0u1+k8q3Hnnnerdu7dOnjypCRMmyO1269y5cwE1V65c0fnz5+3rctxutyoqKgJq6u9f79odp9Mpp9PZaHlUVFSzD9KWjEHo3E79r73qaLSs4dybUtOUbQcb0xo1tXWONtvXrdTcbEywcbdLzbV1bXmMNXWcyW6n1x/T1Pf+Vvvf6t9j8+c//1lfffWV+vTpI0nyeDyqrKxUcXGxXbN7927V1dUpNTXVrtm7d2/A+2xer1cDBgwIen0NAACA1IJgc/HiRZWUlKikpESSdOrUKZWUlKisrEwXL17UggULdODAAZ0+fVq7du3Sww8/rLvuuksZGd+c3hw0aJAmTZqkJ554QocOHdJHH32k7OxsTZs2TYmJiZKk6dOnKzo6WnPmzNHx48e1ceNGvf766wFvNQEAADTU7LeiDh8+rPHjx9v368PGrFmz9Oabb+ro0aNat26dKisrlZiYqPT0dC1btizgbaL169crOztbEyZMUEREhKZOnarVq1fb62NjY7Vjxw5lZWVp5MiR6t27txYtWsRHvdGm+OVjALj9NDvYjBs3Tjf6INX27Y0vRmuoZ8+eKigouGHNsGHD9Ic//KG50wMAAB0YvxUFAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMYg2AAAAGMQbAAAgDEINgAAwBgEGwAAYAyCDQAAMAbBBgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwRqdwTwAA0H71X7il0bLTKzLDMBOgaThjAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMboFO4JAOHQf+GWRstOr8gMw0wAAKHEGRsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMbgU1EAgFvCpwzRnnDGBgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGM0ONnv37tVDDz2kxMREORwOffDBBwHrLcvSokWL1KdPH3Xp0kVpaWn67LPPAmrOnz+vGTNmyOVyKS4uTnPmzNHFixcDao4ePaoHHnhAnTt3VlJSklauXNn8RwcAADqUZgeb6upqDR8+XGvWrAm6fuXKlVq9erXWrl2rgwcPqmvXrsrIyNClS5fsmhkzZuj48ePyer3avHmz9u7dq7lz59rrfT6f0tPTlZycrOLiYr388svKy8vTL37xixY8RAAA0FE0+wv6Jk+erMmTJwddZ1mWXnvtNT333HN6+OGHJUn/9m//poSEBH3wwQeaNm2aPv30U23btk0ff/yxRo0aJUl644039J3vfEc//elPlZiYqPXr1+vy5ct65513FB0drSFDhqikpESrVq0KCEAAAADXCuk3D586dUrl5eVKS0uzl8XGxio1NVVFRUWaNm2aioqKFBcXZ4caSUpLS1NERIQOHjyoRx55REVFRRo7dqyio6PtmoyMDL300kv6y1/+oh49ejTad21trWpra+37Pp9PkuT3++X3+5s0//q6ptYjtNqy/85I67r7D0dNU+YYbEwoa5wR39Q5I6xW31coam42Jti49lxT3/9wHmNtvf/2hNf/8GnY+1t9DhyWZTU+Ips62OHQpk2bNGXKFEnS/v37df/99+vMmTPq06ePXfeP//iPcjgc2rhxo1588UWtW7dOpaWlAduKj4/XkiVLNG/ePKWnpyslJUVvvfWWvf7EiRMaMmSITpw4oUGDBjWaS15enpYsWdJoeUFBgWJiYlr6EAEAQBuqqanR9OnTVVVVJZfL1ezxxvxWVG5urnJycuz7Pp9PSUlJSk9Pb3Jj/H6/vF6vJk6cqKioqNaaKq6jLfs/NG97o2XH8jLCVtOUOQYbE8oaZ4SlZaPq9PzhCBUvmhT2+dys5mZjgo1rzzX1/W94/LflMdbSbbd0/+0Jr//h07D39e+4tFRIg43b7ZYkVVRUBJyxqaio0IgRI+yac+fOBYy7cuWKzp8/b493u92qqKgIqKm/X1/TkNPplNPpbLQ8Kiqq2QdpS8YgdNqi/7VXHUH3G66apswx2JjWqKmtc7TZvm6l5mZjgo27XWqurWvLY6yl227p/tsjXv/Dp773t9r/kH6PTUpKitxut3bt2mUv8/l8OnjwoDwejyTJ4/GosrJSxcXFds3u3btVV1en1NRUu2bv3r0B77N5vV4NGDAg6PU1AAAAUguCzcWLF1VSUqKSkhJJ31wwXFJSorKyMjkcDs2fP18/+clP9Nvf/laffPKJZs6cqcTERPs6nEGDBmnSpEl64okndOjQIX300UfKzs7WtGnTlJiYKEmaPn26oqOjNWfOHB0/flwbN27U66+/HvBWEwAAQEPNfivq8OHDGj9+vH2/PmzMmjVL+fn5euaZZ1RdXa25c+eqsrJS3/72t7Vt2zZ17tzZHrN+/XplZ2drwoQJioiI0NSpU7V69Wp7fWxsrHbs2KGsrCyNHDlSvXv31qJFi/ioNwAAuKFmB5tx48bpRh+kcjgcWrp0qZYuXXrdmp49e6qgoOCG+xk2bJj+8Ic/NHd6AACgA+O3ogAAgDEINgAAwBgEGwAAYAyCDQAAMAbBBgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGM3+SQWgveu/cEujZadXZIZhJgCAtsYZGwAAYAyCDQAAMAbBBgAAGINrbAAArY5r39BWOGMDAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMYg2AAAAGMQbAAAgDEINgAAwBgEGwAAYAyCDQAAMAbBBgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxOoV7AgAASFL/hVsaLTu9IjMMM8HtjDM2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAx+II+3Fb4Ai8AwI1wxgYAABgj5MEmLy9PDocj4DZw4EB7/aVLl5SVlaVevXqpW7dumjp1qioqKgK2UVZWpszMTMXExCg+Pl4LFizQlStXQj1VAABgmFZ5K2rIkCHauXPnX3fS6a+7efrpp7Vlyxa9//77io2NVXZ2th599FF99NFHkqSrV68qMzNTbrdb+/fv19mzZzVz5kxFRUXpxRdfbI3pAgAAQ7RKsOnUqZPcbnej5VVVVfrlL3+pgoICPfjgg5Kkd999V4MGDdKBAwc0ZswY7dixQydOnNDOnTuVkJCgESNGaNmyZXr22WeVl5en6Ojo1pgyAAAwQKtcY/PZZ58pMTFRd955p2bMmKGysjJJUnFxsfx+v9LS0uzagQMHql+/fioqKpIkFRUV6Z577lFCQoJdk5GRIZ/Pp+PHj7fGdAEAgCFCfsYmNTVV+fn5GjBggM6ePaslS5bogQce0LFjx1ReXq7o6GjFxcUFjElISFB5ebkkqby8PCDU1K+vX3c9tbW1qq2tte/7fD5Jkt/vl9/vb9Lc6+uaWo/Qakr/nZHWdcfdzjXBNBwXbEwoa5wR39Q5I6xW31coam42Jti49lxT3/9wHmOtuf/WfByhwOt/+DTs/a0+Bw7LshofSSFUWVmp5ORkrVq1Sl26dNHs2bMDAogkjR49WuPHj9dLL72kuXPn6osvvtD27dvt9TU1Neratau2bt2qyZMnB91PXl6elixZ0mh5QUGBYmJiQvugAABAq6ipqdH06dNVVVUll8vV7PGt/j02cXFxuvvuu3Xy5ElNnDhRly9fVmVlZcBZm4qKCvuaHLfbrUOHDgVso/5TU8Gu26mXm5urnJwc+77P51NSUpLS09Ob3Bi/3y+v16uJEycqKiqqqQ8RIdKU/g/N295o2bG8jNu+JpiG44KNCWWNM8LSslF1ev5whIoXTQr7fG5Wc7Mxwca155r6/jc8/tvyGGvptsP9dyUUeP0Pn4a9r3/HpaVaPdhcvHhRn3/+uR5//HGNHDlSUVFR2rVrl6ZOnSpJKi0tVVlZmTwejyTJ4/HohRde0Llz5xQfHy9J8nq9crlcGjx48HX343Q65XQ6Gy2Piopq9kHakjEInRv1v/aqI2j97V4TTMNxwca0Rk1tnaPN9nUrNTcbE2zc7VJzbV1bHmMt3Xa4/66EEq//4VPf+1vtf8iDzb/8y7/ooYceUnJyss6cOaPFixcrMjJS3/ve9xQbG6s5c+YoJydHPXv2lMvl0lNPPSWPx6MxY8ZIktLT0zV48GA9/vjjWrlypcrLy/Xcc88pKysraHABAHQcfPs4bibkwebPf/6zvve97+mrr77SHXfcoW9/+9s6cOCA7rjjDknSq6++qoiICE2dOlW1tbXKyMjQz3/+c3t8ZGSkNm/erHnz5snj8ahr166aNWuWli5dGuqpAgAAw4Q82GzYsOGG6zt37qw1a9ZozZo1161JTk7W1q1bQz01AABgOH4rCgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACM0eq/7g001dC87Vo5+pv/1v/KLz9uBwBoDs7YAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMwffYAACM0n/hlkbL+E6sjoMzNgAAwBgEGwAAYAyCDQAAMAbBBgAAGINgAwAAjEGwAQAAxiDYAAAAYxBsAACAMQg2AADAGAQbAABgDIINAAAwBsEGAAAYg2ADAACMwa97AwA6nIa/AO6MtLRydJgmg5DijA0AADAGwQYAABiDYAMAAIzBNTZoEw3fz5ak0ysywzATAIDJOGMDAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYfCoKAIAmavgJTz7d2f5wxgYAABiDYAMAAIxBsAEAAMYg2AAAAGNw8TCajYvnAADtFWdsAACAMQg2AADAGLwVBQBACPF2fXhxxgYAABiDMzYdRMP/g5D4vwgAgHkINgjAKVQAwO2MYBNGoTqLwtkYALi98D+RraddB5s1a9bo5ZdfVnl5uYYPH6433nhDo0ePDve02hShBQCApmu3wWbjxo3KycnR2rVrlZqaqtdee00ZGRkqLS1VfHx8uKcHAECr4qxOy7TbYLNq1So98cQTmj17tiRp7dq12rJli9555x0tXLgwzLO7Oc60AABaG+GnsXYZbC5fvqzi4mLl5ubayyIiIpSWlqaioqKgY2pra1VbW2vfr6qqkiSdP39efr+/Sfv1+/2qqanRV199paioqOvWpS7f1WjZwdwJAfc7XaluVPPVV1+165pgdS2tudmYoHP0V6umpk6d/BG6WucIXtPOehbK3jcUqueiqTWd6iy7/629r1DU3GxMsHHtuaa+/w1ff9ryGGvptk2ouV7/G2pvfw9a8nelvWn4b++FCxckSZZltWyDVjv03//935Yka//+/QHLFyxYYI0ePTromMWLF1uSuHHjxo0bN24G3L788ssWZYh2ecamJXJzc5WTk2Pfr6ur0/nz59WrVy85HI4mbcPn8ykpKUlffvmlXC5Xa00V10H/w4v+hxf9Dy/6Hz4Ne29Zli5cuKDExMQWba9dBpvevXsrMjJSFRUVAcsrKirkdruDjnE6nXI6nQHL4uLiWrR/l8vFgR1G9D+86H940f/wov/hc23vY2NjW7yddvmTCtHR0Ro5cqR27frrtSx1dXXatWuXPB5PGGcGAADas3Z5xkaScnJyNGvWLI0aNUqjR4/Wa6+9purqavtTUgAAAA2122Dz2GOP6X/+53+0aNEilZeXa8SIEdq2bZsSEhJabZ9Op1OLFy9u9JYW2gb9Dy/6H170P7zof/iEuvcOy2rp56kAAADal3Z5jQ0AAEBLEGwAAIAxCDYAAMAYBBsAAGAMgs3/W7Nmjfr376/OnTsrNTVVhw4dCveUjLR371499NBDSkxMlMPh0AcffBCw3rIsLVq0SH369FGXLl2Ulpamzz77LDyTNdDy5ct13333qXv37oqPj9eUKVNUWloaUHPp0iVlZWWpV69e6tatm6ZOndroyzLRMm+++aaGDRtmfxGZx+PR7373O3s9vW87K1askMPh0Pz58+1l9L915eXlyeFwBNwGDhxorw9V/wk2kjZu3KicnBwtXrxYf/zjHzV8+HBlZGTo3Llz4Z6acaqrqzV8+HCtWbMm6PqVK1dq9erVWrt2rQ4ePKiuXbsqIyNDly5dauOZmqmwsFBZWVk6cOCAvF6v/H6/0tPTVV391x/Se/rpp/Xhhx/q/fffV2Fhoc6cOaNHH300jLM2R9++fbVixQoVFxfr8OHDevDBB/Xwww/r+PHjkuh9W/n444/11ltvadiwYQHL6X/rGzJkiM6ePWvf9u3bZ68LWf9b9AtThhk9erSVlZVl37969aqVmJhoLV++PIyzMp8ka9OmTfb9uro6y+12Wy+//LK9rLKy0nI6ndavfvWrMMzQfOfOnbMkWYWFhZZlfdPvqKgo6/3337drPv30U0uSVVRUFK5pGq1Hjx7W22+/Te/byIULF6y//du/tbxer/X3f//31o9+9CPLsjj228LixYut4cOHB10Xyv53+DM2ly9fVnFxsdLS0uxlERERSktLU1FRURhn1vGcOnVK5eXlAc9FbGysUlNTeS5aSVVVlSSpZ8+ekqTi4mL5/f6A52DgwIHq168fz0GIXb16VRs2bFB1dbU8Hg+9byNZWVnKzMwM6LPEsd9WPvvsMyUmJurOO+/UjBkzVFZWJim0/W+33zzcVv73f/9XV69ebfSNxgkJCfrTn/4Upll1TOXl5ZIU9LmoX4fQqaur0/z583X//fdr6NChkr55DqKjoxv9gCzPQeh88skn8ng8unTpkrp166ZNmzZp8ODBKikpofetbMOGDfrjH/+ojz/+uNE6jv3Wl5qaqvz8fA0YMEBnz57VkiVL9MADD+jYsWMh7X+HDzZAR5WVlaVjx44FvMeN1jdgwACVlJSoqqpK//Ef/6FZs2apsLAw3NMy3pdffqkf/ehH8nq96ty5c7in0yFNnjzZ/vOwYcOUmpqq5ORkvffee+rSpUvI9tPh34rq3bu3IiMjG115XVFRIbfbHaZZdUz1/ea5aH3Z2dnavHmzfv/736tv3772crfbrcuXL6uysjKgnucgdKKjo3XXXXdp5MiRWr58uYYPH67XX3+d3rey4uJinTt3Tvfee686deqkTp06qbCwUKtXr1anTp2UkJBA/9tYXFyc7r77bp08eTKkx3+HDzbR0dEaOXKkdu3aZS+rq6vTrl275PF4wjizjiclJUVutzvgufD5fDp48CDPRYhYlqXs7Gxt2rRJu3fvVkpKSsD6kSNHKioqKuA5KC0tVVlZGc9BK6mrq1NtbS29b2UTJkzQJ598opKSEvs2atQozZgxw/4z/W9bFy9e1Oeff64+ffqE9vi/hQucjbFhwwbL6XRa+fn51okTJ6y5c+dacXFxVnl5ebinZpwLFy5YR44csY4cOWJJslatWmUdOXLE+uKLLyzLsqwVK1ZYcXFx1m9+8xvr6NGj1sMPP2ylpKRYX3/9dZhnboZ58+ZZsbGx1p49e6yzZ8/at5qaGrvmySeftPr162ft3r3bOnz4sOXxeCyPxxPGWZtj4cKFVmFhoXXq1Cnr6NGj1sKFCy2Hw2Ht2LHDsix639au/VSUZdH/1vbjH//Y2rNnj3Xq1Cnro48+stLS0qzevXtb586dsywrdP0n2Py/N954w+rXr58VHR1tjR492jpw4EC4p2Sk3//+95akRrdZs2ZZlvXNR76ff/55KyEhwXI6ndaECROs0tLS8E7aIMF6L8l699137Zqvv/7a+ud//merR48eVkxMjPXII49YZ8+eDd+kDfKDH/zASk5OtqKjo6077rjDmjBhgh1qLIvet7WGwYb+t67HHnvM6tOnjxUdHW39zd/8jfXYY49ZJ0+etNeHqv8Oy7KsEJxRAgAACLsOf40NAAAwB8EGAAAYg2ADAACMQbABAADGINgAAABjEGwAAIAxCDYAAMAYBBsAAGAMgg0AADAGwQYAABiDYAMAAIxBsAEAAMb4P8F61K6fVtr6AAAAAElFTkSuQmCC",
                        "text/plain": [
                            "<Figure size 640x480 with 1 Axes>"
                        ]
                    },
                    "metadata": {},
                    "output_type": "display_data"
                }
            ],
            "source": [
                "df_var_num.hist(bins=100)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 25,
            "id": "f2f8baff",
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "ids_selected_by_vars:  (53935,)\n"
                    ]
                }
            ],
            "source": [
                "ids_selected_by_vars = df_var_num.loc[df_var_num >= 10].index\n",
                "\n",
                "print(\"ids_selected_by_vars: \", ids_selected_by_vars.shape)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 26,
            "id": "33139d2e",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "22597"
                        ]
                    },
                    "execution_count": 26,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "ids_selected = set(ids_before_selected) & set(ids_after_selected) & set(ids_selected_by_vars)\n",
                "len(ids_selected)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "92e6f7e2",
            "metadata": {},
            "outputs": [],
            "source": [
                "\n",
                "complete_df = complete_df.loc[list(ids_selected)]"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 53,
            "id": "b79f6639",
            "metadata": {},
            "outputs": [],
            "source": [
                "complete_df.to_csv(\n",
                "    path_m4/'processed/mimic4_full_dataset.csv')"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "94f80aae",
            "metadata": {},
            "outputs": [],
            "source": []
        }
    ],
    "metadata": {
        "kernelspec": {
            "display_name": "GNeuralFlow",
            "language": "python",
            "name": "python3"
        },
        "language_info": {
            "codemirror_mode": {
                "name": "ipython",
                "version": 3
            },
            "file_extension": ".py",
            "mimetype": "text/x-python",
            "name": "python",
            "nbconvert_exporter": "python",
            "pygments_lexer": "ipython3",
            "version": "3.10.16"
        }
    },
    "nbformat": 4,
    "nbformat_minor": 5
}
