{
    "cells": [
        {
            "cell_type": "code",
            "execution_count": 1,
            "id": "0e16786e",
            "metadata": {},
            "outputs": [],
            "source": [
                "import os\n",
                "from pathlib import Path\n",
                "import numpy as np\n",
                "import pandas as pd\n",
                "from datetime import timedelta\n",
                "\n",
                "# p_project = Path(__file__).parents[2]\n",
                "p_project = Path(os.getcwd()).parents[1]\n",
                "path_m4 = p_project/'data/mimic4'"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 5,
            "id": "c8c64cf0",
            "metadata": {},
            "outputs": [
                {
                    "name": "stderr",
                    "output_type": "stream",
                    "text": [
                        "/tmp/ipykernel_761391/4199856774.py:7: DtypeWarning: Columns (12) have mixed types. Specify dtype option on import or set low_memory=False.\n",
                        "  inputs_df = pd.read_csv(path_m4/'processed/tables/inputs_processed.csv')[\n",
                        "/tmp/ipykernel_761391/4199856774.py:11: DtypeWarning: Columns (8,11,14) have mixed types. Specify dtype option on import or set low_memory=False.\n",
                        "  presc_df = pd.read_csv(path_m4/'processed/tables/prescriptions_processed.csv')[\n"
                    ]
                }
            ],
            "source": [
                "lab_df = pd.read_csv(path_m4/'processed/tables/lab_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'valuenum', 'label']]\n",
                "inputs_df = pd.read_csv(path_m4/'processed/tables/inputs_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'amount', 'label']]\n",
                "outputs_df = pd.read_csv(path_m4/'processed/tables/outputs_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'value', 'label']]\n",
                "presc_df = pd.read_csv(path_m4/'processed/tables/prescriptions_processed.csv')[\n",
                "    ['subject_id', 'hadm_id', 'charttime', 'dose_val_rx', 'drug']]\n",
                "\n",
                "# Change the name of amount. Valuenum for every table\n",
                "inputs_df['valuenum'] = inputs_df['amount']\n",
                "inputs_df = inputs_df.drop(columns=['amount']).copy()\n",
                "\n",
                "outputs_df['valuenum'] = outputs_df['value']\n",
                "outputs_df = outputs_df.drop(columns=['value']).copy()\n",
                "\n",
                "presc_df['valuenum'] = presc_df['dose_val_rx']\n",
                "presc_df = presc_df.drop(columns=['dose_val_rx']).copy()\n",
                "presc_df['label'] = presc_df['drug']\n",
                "presc_df = presc_df.drop(columns=['drug']).copy()\n",
                "\n",
                "# Tag to distinguish between lab and inputs events\n",
                "inputs_df['Origin'] = 'Inputs'\n",
                "lab_df['Origin'] = 'Lab'\n",
                "outputs_df['Origin'] = 'Outputs'\n",
                "presc_df['Origin'] = 'Prescriptions'\n",
                "\n",
                "merged_df = pd.concat((inputs_df, lab_df, outputs_df, presc_df)).reset_index()\n",
                "\n",
                "# Check that all labels have different names.\n",
                "assert(merged_df['label'].nunique() == (inputs_df['label'].nunique(\n",
                ")+lab_df['label'].nunique()+outputs_df['label'].nunique()+presc_df['label'].nunique()))"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "95861979",
            "metadata": {},
            "outputs": [],
            "source": [
                "# set the timestamp as the time delta between the first chart time for each admission\n",
                "merged_df['charttime'] = pd.to_datetime(\n",
                "    merged_df['charttime'], format='%Y-%m-%d %H:%M:%S')\n",
                "ref_time = merged_df.groupby('hadm_id')['charttime'].min()\n",
                "merged_df_1 = pd.merge(ref_time.to_frame(name='ref_time'),\n",
                "                       merged_df, left_index=True, right_on='hadm_id')\n",
                "merged_df_1['time_stamp'] = merged_df_1['charttime']-merged_df_1['ref_time']\n",
                "assert(len(merged_df_1.loc[merged_df_1['time_stamp']\n",
                "       < timedelta(hours=0)].index) == 0)\n",
                "\n",
                "# Create a label code (int) for the labels.\n",
                "label_dict = dict(zip(list(merged_df_1['label'].unique()), range(\n",
                "    len(list(merged_df_1['label'].unique())))))\n",
                "merged_df_1['label_code'] = merged_df_1['label'].map(label_dict)\n",
                "\n",
                "label_dict_df = pd.Series(merged_df_1['label'].unique()).reset_index()\n",
                "label_dict_df.columns = ['index', 'label']\n",
                "label_dict_df['label_code'] = label_dict_df['label'].map(label_dict)\n",
                "label_dict_df.drop(columns=['index'], inplace=True)\n",
                "label_dict_df.to_csv(path_m4/'processed/tables/variable_name_dict.csv')\n",
                "\n",
                "merged_df_short = merged_df_1[['hadm_id', 'valuenum', 'time_stamp', 'label_code']].rename(\n",
                "    columns={'hadm_id': 'ID', 'time_stamp': 'Time'})\n",
                "\n",
                "# select patients who have records in both the first 24 hours and the second 24 hours\n",
                "ids_before_24 = merged_df_short.loc[(\n",
                "    merged_df_short['Time'] < timedelta(hours=24))]['ID'].unique()\n",
                "\n",
                "ids_after_24 = merged_df_short.loc[(merged_df_short['Time'] >= timedelta(hours=24)) &\n",
                "                                   (merged_df_short['Time'] < timedelta(hours=48))]['ID'].unique()\n",
                "\n",
                "merged_df_short = merged_df_short.loc[merged_df_short['ID'].isin(\n",
                "    set(ids_before_24) & set(ids_after_24))]\n",
                "\n",
                "# select 48h records\n",
                "merged_df_short = merged_df_short.loc[merged_df_short['Time'] < timedelta(\n",
                "    hours=48)]\n",
                "\n",
                "# The sampling interval is 1 minute\n",
                "merged_df_short['Time'] = merged_df_short['Time'].dt.total_seconds().div(\n",
                "    60).astype(int)\n",
                "assert(len(merged_df_short.loc[merged_df_short['Time'] > 2880].index) == 0)\n",
                "\n",
                "value_df = pd.pivot_table(merged_df_short, values='valuenum', index=[\n",
                "                          'ID', 'Time'], columns=['label_code'], aggfunc=np.max)\n",
                "mask_df = value_df.notna()\n",
                "\n",
                "d_values = {}\n",
                "d_masks = {}\n",
                "for i in value_df.columns:\n",
                "    d_values[i] = \"Value_\" + str(i)\n",
                "    d_masks[i] = \"Mask_\" + str(i)\n",
                "\n",
                "value_df.rename(columns=d_values, inplace=True)\n",
                "mask_df.rename(columns=d_masks, inplace=True)\n",
                "\n",
                "value_df.fillna(0, inplace=True)\n",
                "mask_df = mask_df.astype(int)\n",
                "\n",
                "complete_df = pd.concat((value_df, mask_df), axis=1).reset_index()\n",
                "\n",
                "complete_df['ID'] = complete_df['ID'].astype(int)\n",
                "\n",
                "complete_df.sort_values([\"ID\", \"Time\"], inplace=True)\n"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 2,
            "id": "0190afa5",
            "metadata": {},
            "outputs": [],
            "source": [
                "complete_df = pd.read_csv(path_m4/'processed/mimic4_full_dataset.csv', index_col=0)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "e964afc9",
            "metadata": {},
            "outputs": [],
            "source": []
        },
        {
            "cell_type": "code",
            "execution_count": 3,
            "id": "7c173967",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th></th>\n",
                            "      <th>Time</th>\n",
                            "      <th>Value_0</th>\n",
                            "      <th>Value_1</th>\n",
                            "      <th>Value_2</th>\n",
                            "      <th>Value_3</th>\n",
                            "      <th>Value_4</th>\n",
                            "      <th>Value_5</th>\n",
                            "      <th>Value_6</th>\n",
                            "      <th>Value_7</th>\n",
                            "      <th>Value_8</th>\n",
                            "      <th>...</th>\n",
                            "      <th>Mask_86</th>\n",
                            "      <th>Mask_87</th>\n",
                            "      <th>Mask_88</th>\n",
                            "      <th>Mask_89</th>\n",
                            "      <th>Mask_90</th>\n",
                            "      <th>Mask_91</th>\n",
                            "      <th>Mask_92</th>\n",
                            "      <th>Mask_93</th>\n",
                            "      <th>Mask_94</th>\n",
                            "      <th>Mask_95</th>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>ID</th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>578</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>599</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>693</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>720</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>0.0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "<p>5 rows × 193 columns</p>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "          Time  Value_0  Value_1  Value_2  Value_3  Value_4  Value_5  Value_6  \\\n",
                            "ID                                                                              \n",
                            "20000147     0      0.0      0.0      0.0      0.0      0.0      0.0      0.0   \n",
                            "20000147   578      0.0      0.0      0.0      0.0      0.0      0.0      0.0   \n",
                            "20000147   599      0.0      0.0      0.0      0.0      0.0      0.0      0.0   \n",
                            "20000147   693      0.0      0.0      0.0      0.0      0.0      0.0      0.0   \n",
                            "20000147   720      0.0      0.0      0.0      0.0      0.0      0.0      0.0   \n",
                            "\n",
                            "          Value_7  Value_8  ...  Mask_86  Mask_87  Mask_88  Mask_89  Mask_90  \\\n",
                            "ID                          ...                                                \n",
                            "20000147      0.0      0.0  ...        0        0        0        0        0   \n",
                            "20000147      0.0      0.0  ...        0        0        0        0        0   \n",
                            "20000147      0.0      0.0  ...        0        0        0        0        0   \n",
                            "20000147      0.0      0.0  ...        0        0        0        0        0   \n",
                            "20000147      0.0      0.0  ...        0        0        0        0        0   \n",
                            "\n",
                            "          Mask_91  Mask_92  Mask_93  Mask_94  Mask_95  \n",
                            "ID                                                     \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "\n",
                            "[5 rows x 193 columns]"
                        ]
                    },
                    "execution_count": 3,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "complete_df.head()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 9,
            "id": "d7423fd5",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "(5670039, 193)"
                        ]
                    },
                    "execution_count": 9,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "complete_df.shape"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 10,
            "id": "be2bd4dc",
            "metadata": {},
            "outputs": [],
            "source": [
                "# Calculate the standard deviation of elements along the axis 0. \n",
                "# Turn elements out of 5 times of the standard deviation into 0.\n",
                "def remove_outlier(data, mask, threshold=5):\n",
                "    mean = np.mean(data, axis=0)\n",
                "    std = np.std(data, axis=0)\n",
                "    mask_outlier = abs(data - mean) > threshold * std\n",
                "    data = np.where(mask_outlier, 0, data)\n",
                "    mask = np.where(mask_outlier, 0, mask)\n",
                "    return data, mask\n",
                "\n",
                "value_cols = []\n",
                "mask_cols = []\n",
                "for col in complete_df.columns:\n",
                "    value_cols.append(col.startswith(\"Value\"))\n",
                "    mask_cols.append(col.startswith(\"Mask\"))\n",
                "\n",
                "value = complete_df.loc[:, value_cols].values\n",
                "mask = complete_df.loc[:, mask_cols].values\n",
                "value_new, mask_new = remove_outlier(value, mask)\n",
                "complete_df.loc[:, value_cols] = value_new\n",
                "complete_df.loc[:, mask_cols] = mask_new\n",
                "complete_df = complete_df.loc[complete_df.loc[:, mask_cols].sum(axis=1) > 0]"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 12,
            "id": "5d5987d3",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "(4928645, 193)"
                        ]
                    },
                    "execution_count": 12,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "complete_df.shape"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 15,
            "id": "32b45828",
            "metadata": {},
            "outputs": [],
            "source": [
                "Mask_df = complete_df.filter(regex='^(?!.*Value).*', axis=1) # Exclude columns with Value in the name"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 16,
            "id": "bd54c227",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/html": [
                            "<div>\n",
                            "<style scoped>\n",
                            "    .dataframe tbody tr th:only-of-type {\n",
                            "        vertical-align: middle;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe tbody tr th {\n",
                            "        vertical-align: top;\n",
                            "    }\n",
                            "\n",
                            "    .dataframe thead th {\n",
                            "        text-align: right;\n",
                            "    }\n",
                            "</style>\n",
                            "<table border=\"1\" class=\"dataframe\">\n",
                            "  <thead>\n",
                            "    <tr style=\"text-align: right;\">\n",
                            "      <th></th>\n",
                            "      <th>Time</th>\n",
                            "      <th>Mask_0</th>\n",
                            "      <th>Mask_1</th>\n",
                            "      <th>Mask_2</th>\n",
                            "      <th>Mask_3</th>\n",
                            "      <th>Mask_4</th>\n",
                            "      <th>Mask_5</th>\n",
                            "      <th>Mask_6</th>\n",
                            "      <th>Mask_7</th>\n",
                            "      <th>Mask_8</th>\n",
                            "      <th>...</th>\n",
                            "      <th>Mask_86</th>\n",
                            "      <th>Mask_87</th>\n",
                            "      <th>Mask_88</th>\n",
                            "      <th>Mask_89</th>\n",
                            "      <th>Mask_90</th>\n",
                            "      <th>Mask_91</th>\n",
                            "      <th>Mask_92</th>\n",
                            "      <th>Mask_93</th>\n",
                            "      <th>Mask_94</th>\n",
                            "      <th>Mask_95</th>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>ID</th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "      <th></th>\n",
                            "    </tr>\n",
                            "  </thead>\n",
                            "  <tbody>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>578</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>599</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>693</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>720</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "    <tr>\n",
                            "      <th>20000147</th>\n",
                            "      <td>742</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>...</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "      <td>0</td>\n",
                            "    </tr>\n",
                            "  </tbody>\n",
                            "</table>\n",
                            "<p>5 rows × 97 columns</p>\n",
                            "</div>"
                        ],
                        "text/plain": [
                            "          Time  Mask_0  Mask_1  Mask_2  Mask_3  Mask_4  Mask_5  Mask_6  \\\n",
                            "ID                                                                       \n",
                            "20000147   578       0       0       0       0       0       0       0   \n",
                            "20000147   599       0       0       0       0       0       0       0   \n",
                            "20000147   693       0       0       0       0       0       0       0   \n",
                            "20000147   720       0       0       0       0       0       0       0   \n",
                            "20000147   742       0       0       0       0       0       0       0   \n",
                            "\n",
                            "          Mask_7  Mask_8  ...  Mask_86  Mask_87  Mask_88  Mask_89  Mask_90  \\\n",
                            "ID                        ...                                                \n",
                            "20000147       0       0  ...        0        0        0        0        0   \n",
                            "20000147       0       0  ...        0        0        0        0        0   \n",
                            "20000147       0       0  ...        0        0        0        0        0   \n",
                            "20000147       0       0  ...        0        0        0        0        0   \n",
                            "20000147       0       0  ...        0        0        0        0        0   \n",
                            "\n",
                            "          Mask_91  Mask_92  Mask_93  Mask_94  Mask_95  \n",
                            "ID                                                     \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "20000147        0        0        0        0        0  \n",
                            "\n",
                            "[5 rows x 97 columns]"
                        ]
                    },
                    "execution_count": 16,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "Mask_df.head()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 17,
            "id": "5e8746aa",
            "metadata": {},
            "outputs": [],
            "source": [
                "tmp_df = Mask_df.groupby('ID').size()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 18,
            "id": "ffe5fb0d",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "<AxesSubplot: >"
                        ]
                    },
                    "execution_count": 18,
                    "metadata": {},
                    "output_type": "execute_result"
                },
                {
                    "data": {
                        "image/png": "iVBORw0KGgoAAAANSUhEUgAABk8AAAGsCAYAAAB0JjBdAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjYuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8o6BhiAAAACXBIWXMAAA9hAAAPYQGoP6dpAAA1sUlEQVR4nO3df5SW9X0n/PcIw/CjMBEoM8yKCSbEmICuiw0OSaMbYNCVkNQ9dRvSqW2smvUni67RuOdk3DXg0lO1CxtrrI026CFPT2M2PyeMTULWQ1AkYYPEQ+2JMdoyYjYwoJBhgtfzRx/v5xpHkEFguG9er3M48b6uz9z39xrezEHf+V5XXVEURQAAAAAAAEiSnDTUCwAAAAAAADieKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFAyfKgXcLS8+uqr+ed//ueMHTs2dXV1Q70cAAAAAABgCBVFkd27d6elpSUnnXTwvSU1W5788z//c6ZMmTLUywAAAAAAAI4jzz//fE455ZSDztRseTJ27Ngk//JNGDdu3BCv5vjQ19eXNWvWpK2tLfX19UO9HDhsskwtkWdqhSxTS+SZWiHL1BJ5plbIMrWkGvO8a9euTJkypdIfHEzNliev3apr3LhxypP/T19fX0aPHp1x48ZVTZjhjcgytUSeqRWyTC2RZ2qFLFNL5JlaIcvUkmrO86E86sMD4wEAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUDB/qBXD8ecfN3zzguZ/fcdExXAkAAAAAABx7dp4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJYMqTzo6OlJXV9fvV3Nzc+V8URTp6OhIS0tLRo0alfPPPz9btmzp9x69vb259tprM3HixIwZMyYLFy7MCy+80G9mx44daW9vT2NjYxobG9Pe3p6dO3ce/lUCAAAAAAAcokHvPHnf+96Xbdu2VX5t3ry5cm758uW58847s3LlymzYsCHNzc2ZN29edu/eXZlZvHhxHnnkkaxevTqPPfZYXn755SxYsCD79++vzCxatCibNm1KZ2dnOjs7s2nTprS3t7/FSwUAAAAAAHhzwwf9BcOH99tt8pqiKHL33Xfn1ltvzcUXX5wkefDBB9PU1JSHH344V155ZXp6enL//ffnS1/6UubOnZskWbVqVaZMmZJHH3008+fPz9NPP53Ozs6sX78+s2bNSpLcd999aW1tzdatW3P66ae/lesFAAAAAAA4qEGXJ88880xaWlrS0NCQWbNmZenSpTnttNPy7LPPpru7O21tbZXZhoaGnHfeeVm3bl2uvPLKbNy4MX19ff1mWlpaMn369Kxbty7z58/PD3/4wzQ2NlaKkyQ599xz09jYmHXr1h2wPOnt7U1vb2/l9a5du5IkfX196evrG+xl1qTXvg9v9v1oGFa86XvAUDrULEM1kGdqhSxTS+SZWiHL1BJ5plbIMrWkGvM8mLUOqjyZNWtW/uZv/ibvfve78+KLL+b222/P7Nmzs2XLlnR3dydJmpqa+n1NU1NTnnvuuSRJd3d3RowYkZNPPnnAzGtf393dnUmTJg347EmTJlVm3siyZcty2223DTi+Zs2ajB49ejCXWfO6uroOen75+w987lvf+tYRXg0cvjfLMlQTeaZWyDK1RJ6pFbJMLZFnaoUsU0uqKc979uw55NlBlScXXnhh5Z9nzJiR1tbWvPOd78yDDz6Yc889N0lSV1fX72uKohhw7PVeP/NG82/2PrfcckuWLFlSeb1r165MmTIlbW1tGTdu3MEv7ATR19eXrq6uzJs3L/X19Qecm97xnQOee6pj/tFYGgzKoWYZqoE8UytkmVoiz9QKWaaWyDO1QpapJdWY59fuWHUoBn3brrIxY8ZkxowZeeaZZ/Kxj30syb/sHJk8eXJlZvv27ZXdKM3Nzdm3b1927NjRb/fJ9u3bM3v27MrMiy++OOCzXnrppQG7WsoaGhrS0NAw4Hh9fX3V/MYdK2/2Pendf+CSyveS44k/39QSeaZWyDK1RJ6pFbJMLZFnaoUsU0uqKc+DWedJb+WDent78/TTT2fy5MmZOnVqmpub+23R2bdvX9auXVspRmbOnJn6+vp+M9u2bctTTz1VmWltbU1PT0+eeOKJyszjjz+enp6eygwAAAAAAMDRMqidJzfeeGM+8pGP5NRTT8327dtz++23Z9euXbn00ktTV1eXxYsXZ+nSpZk2bVqmTZuWpUuXZvTo0Vm0aFGSpLGxMZdddlluuOGGTJgwIePHj8+NN96YGTNmZO7cuUmSM844IxdccEEuv/zy3HvvvUmSK664IgsWLDjgw+IBAAAAAACOlEGVJy+88EI+/vGP55e//GV++7d/O+eee27Wr1+ft7/97UmSm266KXv37s1VV12VHTt2ZNasWVmzZk3Gjh1beY+77rorw4cPzyWXXJK9e/dmzpw5eeCBBzJs2LDKzEMPPZTrrrsubW1tSZKFCxdm5cqVR+J6AQAAAAAADmpQ5cnq1asPer6uri4dHR3p6Og44MzIkSOzYsWKrFix4oAz48ePz6pVqwazNAAAAAAAgCPiLT3zBAAAAAAAoNYoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASt5SebJs2bLU1dVl8eLFlWNFUaSjoyMtLS0ZNWpUzj///GzZsqXf1/X29ubaa6/NxIkTM2bMmCxcuDAvvPBCv5kdO3akvb09jY2NaWxsTHt7e3bu3PlWlgsAAAAAAPCmDrs82bBhQ77whS/kzDPP7Hd8+fLlufPOO7Ny5cps2LAhzc3NmTdvXnbv3l2ZWbx4cR555JGsXr06jz32WF5++eUsWLAg+/fvr8wsWrQomzZtSmdnZzo7O7Np06a0t7cf7nIBAAAAAAAOyWGVJy+//HI+8YlP5L777svJJ59cOV4URe6+++7ceuutufjiizN9+vQ8+OCD2bNnTx5++OEkSU9PT+6///78+Z//eebOnZuzzz47q1atyubNm/Poo48mSZ5++ul0dnbmr/7qr9La2prW1tbcd999+cY3vpGtW7cegcsGAAAAAAB4Y8MP54uuvvrqXHTRRZk7d25uv/32yvFnn3023d3daWtrqxxraGjIeeedl3Xr1uXKK6/Mxo0b09fX12+mpaUl06dPz7p16zJ//vz88Ic/TGNjY2bNmlWZOffcc9PY2Jh169bl9NNPH7Cm3t7e9Pb2Vl7v2rUrSdLX15e+vr7Ducya89r34c2+Hw3Dijd9DxhKh5plqAbyTK2QZWqJPFMrZJlaIs/UClmmllRjngez1kGXJ6tXr86PfvSjbNiwYcC57u7uJElTU1O/401NTXnuuecqMyNGjOi3Y+W1mde+vru7O5MmTRrw/pMmTarMvN6yZcty2223DTi+Zs2ajB49+hCu7MTR1dV10PPL33/gc9/61reO8Grg8L1ZlqGayDO1QpapJfJMrZBlaok8UytkmVpSTXnes2fPIc8Oqjx5/vnnc/3112fNmjUZOXLkAefq6ur6vS6KYsCx13v9zBvNH+x9brnllixZsqTyeteuXZkyZUra2toybty4g372iaKvry9dXV2ZN29e6uvrDzg3veM7Bzz3VMf8o7E0GJRDzTJUA3mmVsgytUSeqRWyTC2RZ2qFLFNLqjHPr92x6lAMqjzZuHFjtm/fnpkzZ1aO7d+/Pz/4wQ+ycuXKyvNIuru7M3ny5MrM9u3bK7tRmpubs2/fvuzYsaPf7pPt27dn9uzZlZkXX3xxwOe/9NJLA3a1vKahoSENDQ0DjtfX11fNb9yx8mbfk979By66fC85nvjzTS2RZ2qFLFNL5JlaIcvUEnmmVsgytaSa8jyYdQ7qgfFz5szJ5s2bs2nTpsqvc845J5/4xCeyadOmnHbaaWlubu63TWffvn1Zu3ZtpRiZOXNm6uvr+81s27YtTz31VGWmtbU1PT09eeKJJyozjz/+eHp6eiozAAAAAAAAR8Ogdp6MHTs206dP73dszJgxmTBhQuX44sWLs3Tp0kybNi3Tpk3L0qVLM3r06CxatChJ0tjYmMsuuyw33HBDJkyYkPHjx+fGG2/MjBkzMnfu3CTJGWeckQsuuCCXX3557r333iTJFVdckQULFrzhw+IBAAAAAACOlEE/MP7N3HTTTdm7d2+uuuqq7NixI7NmzcqaNWsyduzYysxdd92V4cOH55JLLsnevXszZ86cPPDAAxk2bFhl5qGHHsp1112Xtra2JMnChQuzcuXKI71cAAAAAACAft5yefL973+/3+u6urp0dHSko6PjgF8zcuTIrFixIitWrDjgzPjx47Nq1aq3ujwAAAAAAIBBGdQzTwAAAAAAAGqd8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQMnyoF8DQeMfN3xzqJQAAAAAAwHHJzhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKBlUeXLPPffkzDPPzLhx4zJu3Li0trbm29/+duV8URTp6OhIS0tLRo0alfPPPz9btmzp9x69vb259tprM3HixIwZMyYLFy7MCy+80G9mx44daW9vT2NjYxobG9Pe3p6dO3ce/lUCAAAAAAAcokGVJ6ecckruuOOOPPnkk3nyySfz4Q9/OB/96EcrBcny5ctz5513ZuXKldmwYUOam5szb9687N69u/IeixcvziOPPJLVq1fnsccey8svv5wFCxZk//79lZlFixZl06ZN6ezsTGdnZzZt2pT29vYjdMkAAAAAAAAHNnwwwx/5yEf6vf7c5z6Xe+65J+vXr8973/ve3H333bn11ltz8cUXJ0kefPDBNDU15eGHH86VV16Znp6e3H///fnSl76UuXPnJklWrVqVKVOm5NFHH838+fPz9NNPp7OzM+vXr8+sWbOSJPfdd19aW1uzdevWnH766UfiugEAAAAAAN7QoMqTsv379+dv//Zv88orr6S1tTXPPvtsuru709bWVplpaGjIeeedl3Xr1uXKK6/Mxo0b09fX12+mpaUl06dPz7p16zJ//vz88Ic/TGNjY6U4SZJzzz03jY2NWbdu3QHLk97e3vT29lZe79q1K0nS19eXvr6+w73MmvLa96Gvry8Nw4q39B4wlMpZhmonz9QKWaaWyDO1QpapJfJMrZBlakk15nkwax10ebJ58+a0trbm17/+dX7rt34rjzzySN773vdm3bp1SZKmpqZ+801NTXnuueeSJN3d3RkxYkROPvnkATPd3d2VmUmTJg343EmTJlVm3siyZcty2223DTi+Zs2ajB49enAXWeO6urqy/P2H97Xf+ta3juxi4C3o6uoa6iXAESPP1ApZppbIM7VClqkl8kytkGVqSTXlec+ePYc8O+jy5PTTT8+mTZuyc+fO/N3f/V0uvfTSrF27tnK+rq6u33xRFAOOvd7rZ95o/s3e55ZbbsmSJUsqr3ft2pUpU6akra0t48aNe9PrOhH09fWlq6sr8+bNy9mf++5hvcdTHfOP8Kpg8MpZrq+vH+rlwFsiz9QKWaaWyDO1QpapJfJMrZBlakk15vm1O1YdikGXJyNGjMi73vWuJMk555yTDRs25C/+4i/y6U9/Osm/7ByZPHlyZX779u2V3SjNzc3Zt29fduzY0W/3yfbt2zN79uzKzIsvvjjgc1966aUBu1rKGhoa0tDQMOB4fX191fzGHSv19fXp3X/wQutgXwvHC3++qSXyTK2QZWqJPFMrZJlaIs/UClmmllRTngezzpPe6ocVRZHe3t5MnTo1zc3N/bbo7Nu3L2vXrq0UIzNnzkx9fX2/mW3btuWpp56qzLS2tqanpydPPPFEZebxxx9PT09PZQYAAAAAAOBoGdTOk8985jO58MILM2XKlOzevTurV6/O97///XR2dqauri6LFy/O0qVLM23atEybNi1Lly7N6NGjs2jRoiRJY2NjLrvsstxwww2ZMGFCxo8fnxtvvDEzZszI3LlzkyRnnHFGLrjgglx++eW59957kyRXXHFFFixYcMCHxQMAAAAAABwpgypPXnzxxbS3t2fbtm1pbGzMmWeemc7OzsybNy9JctNNN2Xv3r256qqrsmPHjsyaNStr1qzJ2LFjK+9x1113Zfjw4bnkkkuyd+/ezJkzJw888ECGDRtWmXnooYdy3XXXpa2tLUmycOHCrFy58khcLwAAAAAAwEENqjy5//77D3q+rq4uHR0d6ejoOODMyJEjs2LFiqxYseKAM+PHj8+qVasGszQAAAAAAIAj4i0/8wQAAAAAAKCWKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXDh3oBVJd33PzNA577+R0XHcOVAAAAAADA0WHnCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEoGVZ4sW7Ysv/M7v5OxY8dm0qRJ+djHPpatW7f2mymKIh0dHWlpacmoUaNy/vnnZ8uWLf1ment7c+2112bixIkZM2ZMFi5cmBdeeKHfzI4dO9Le3p7GxsY0Njamvb09O3fuPLyrBAAAAAAAOESDKk/Wrl2bq6++OuvXr09XV1d+85vfpK2tLa+88kplZvny5bnzzjuzcuXKbNiwIc3NzZk3b152795dmVm8eHEeeeSRrF69Oo899lhefvnlLFiwIPv376/MLFq0KJs2bUpnZ2c6OzuzadOmtLe3H4FLBgAAAAAAOLDhgxnu7Ozs9/qLX/xiJk2alI0bN+ZDH/pQiqLI3XffnVtvvTUXX3xxkuTBBx9MU1NTHn744Vx55ZXp6enJ/fffny996UuZO3dukmTVqlWZMmVKHn300cyfPz9PP/10Ojs7s379+syaNStJct9996W1tTVbt27N6aefPmBtvb296e3trbzetWtXkqSvry99fX2Ducya9dr3oa+vLw3DiiP+/qff+o0DnnuqY/4R/zxOXOUsQ7WTZ2qFLFNL5JlaIcvUEnmmVsgytaQa8zyYtdYVRXHY/xX9H//xHzNt2rRs3rw506dPz89+9rO8853vzI9+9KOcffbZlbmPfvSjedvb3pYHH3ww3/3udzNnzpz86le/ysknn1yZOeuss/Kxj30st912W/76r/86S5YsGXCbrre97W2566678id/8icD1tLR0ZHbbrttwPGHH344o0ePPtxLBAAAAAAAasCePXuyaNGi9PT0ZNy4cQedHdTOk7KiKLJkyZJ88IMfzPTp05Mk3d3dSZKmpqZ+s01NTXnuuecqMyNGjOhXnLw289rXd3d3Z9KkSQM+c9KkSZWZ17vllluyZMmSyutdu3ZlypQpaWtre9Nvwomir68vXV1dmTdvXs7+3HeP6WfbecKRVM5yfX39UC8H3hJ5plbIMrVEnqkVskwtkWdqhSxTS6oxz6/dsepQHHZ5cs011+QnP/lJHnvssQHn6urq+r0uimLAsdd7/cwbzR/sfRoaGtLQ0DDgeH19fdX8xh0r9fX16d1/8N+Po/GZcKT5800tkWdqhSxTS+SZWiHL1BJ5plbIMrWkmvI8mHUO6oHxr7n22mvzta99Ld/73vdyyimnVI43NzcnyYDdIdu3b6/sRmlubs6+ffuyY8eOg868+OKLAz73pZdeGrCrBQAAAAAA4EgaVHlSFEWuueaafOUrX8l3v/vdTJ06td/5qVOnprm5OV1dXZVj+/bty9q1azN79uwkycyZM1NfX99vZtu2bXnqqacqM62trenp6ckTTzxRmXn88cfT09NTmQEAAAAAADgaBnXbrquvvjoPP/xw/tf/+l8ZO3ZsZYdJY2NjRo0albq6uixevDhLly7NtGnTMm3atCxdujSjR4/OokWLKrOXXXZZbrjhhkyYMCHjx4/PjTfemBkzZmTu3LlJkjPOOCMXXHBBLr/88tx7771JkiuuuCILFizI6aeffiSvHwAAAAAAoJ9BlSf33HNPkuT888/vd/yLX/xi/viP/zhJctNNN2Xv3r256qqrsmPHjsyaNStr1qzJ2LFjK/N33XVXhg8fnksuuSR79+7NnDlz8sADD2TYsGGVmYceeijXXXdd2trakiQLFy7MypUrD+caAQAAAAAADtmgypOiKN50pq6uLh0dHeno6DjgzMiRI7NixYqsWLHigDPjx4/PqlWrBrM8AAAAAACAt+ywHhgPAAAAAABQq5QnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACgRHkCAAAAAABQojwBAAAAAAAoUZ4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAICS4UO9AE4M77j5mwc89/M7LjqGKwEAAAAAgIOz8wQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASoYP9QLgHTd/84Dnfn7HRcdwJQAAAAAAYOcJAAAAAABAP8oTAAAAAACAErft4rh2sFt6HYzbfQEAAAAAcLjsPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgJLhQ70AOBrecfM3D3ju53dcdAxXAgAAAABAtbHzBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlHhgPJR40DwAAAAAAHaeAAAAAAAAlChPAAAAAAAASty2ixPOwW7NBQAAAAAAdp4AAAAAAACUKE8AAAAAAABKlCcAAAAAAAAlyhMAAAAAAIAS5QkAAAAAAECJ8gQAAAAAAKBEeQIAAAAAAFCiPAEAAAAAACgZPtQLgGrxjpu/ecBzP7/jomO4EgAAAAAAjiY7TwAAAAAAAEqUJwAAAAAAACXKEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoGTQ5ckPfvCDfOQjH0lLS0vq6ury1a9+td/5oijS0dGRlpaWjBo1Kueff362bNnSb6a3tzfXXnttJk6cmDFjxmThwoV54YUX+s3s2LEj7e3taWxsTGNjY9rb27Nz585BXyAAAAAAAMBgDB/sF7zyyis566yz8id/8if59//+3w84v3z58tx555154IEH8u53vzu333575s2bl61bt2bs2LFJksWLF+frX/96Vq9enQkTJuSGG27IggULsnHjxgwbNixJsmjRorzwwgvp7OxMklxxxRVpb2/P17/+9bdyvXBUvOPmbx7w3M/vuOgYrgQAAAAAgLdq0OXJhRdemAsvvPANzxVFkbvvvju33nprLr744iTJgw8+mKampjz88MO58sor09PTk/vvvz9f+tKXMnfu3CTJqlWrMmXKlDz66KOZP39+nn766XR2dmb9+vWZNWtWkuS+++5La2trtm7dmtNPP/1wrxcAAAAAAOCgBl2eHMyzzz6b7u7utLW1VY41NDTkvPPOy7p163LllVdm48aN6evr6zfT0tKS6dOnZ926dZk/f35++MMfprGxsVKcJMm5556bxsbGrFu37g3Lk97e3vT29lZe79q1K0nS19eXvr6+I3mZVeu170NfX18ahhVDvJoTh/wdeeUsQ7WTZ2qFLFNL5JlaIcvUEnmmVsgytaQa8zyYtR7R8qS7uztJ0tTU1O94U1NTnnvuucrMiBEjcvLJJw+Yee3ru7u7M2nSpAHvP2nSpMrM6y1btiy33XbbgONr1qzJ6NGjB38xNayrqyvL3z/UqzhxfOtb3xrqJdSsrq6uoV4CHDHyTK2QZWqJPFMrZJlaIs/UClmmllRTnvfs2XPIs0e0PHlNXV1dv9dFUQw49nqvn3mj+YO9zy233JIlS5ZUXu/atStTpkxJW1tbxo0bN5jl16y+vr50dXVl3rx5Oftz3x3q5ZwwnuqYP9RLqDnlLNfX1w/1cuAtkWdqhSxTS+SZWiHL1BJ5plbIMrWkGvP82h2rDsURLU+am5uT/MvOkcmTJ1eOb9++vbIbpbm5Ofv27cuOHTv67T7Zvn17Zs+eXZl58cUXB7z/Sy+9NGBXy2saGhrS0NAw4Hh9fX3V/MYdK/X19endf/AyiyNH/o4ef76pJfJMrZBlaok8UytkmVoiz9QKWaaWVFOeB7POk47kB0+dOjXNzc39tuns27cva9eurRQjM2fOTH19fb+Zbdu25amnnqrMtLa2pqenJ0888URl5vHHH09PT09lBgAAAAAA4GgY9M6Tl19+Of/4j/9Yef3ss89m06ZNGT9+fE499dQsXrw4S5cuzbRp0zJt2rQsXbo0o0ePzqJFi5IkjY2Nueyyy3LDDTdkwoQJGT9+fG688cbMmDEjc+fOTZKcccYZueCCC3L55Zfn3nvvTZJcccUVWbBgwRs+LB6q1Ttu/uYBz/38jouO4UoAAAAAAHjNoMuTJ598Mv/23/7byuvXnjNy6aWX5oEHHshNN92UvXv35qqrrsqOHTsya9asrFmzJmPHjq18zV133ZXhw4fnkksuyd69ezNnzpw88MADGTZsWGXmoYceynXXXZe2trYkycKFC7Ny5crDvlAAAAAAAIBDMejy5Pzzz09RFAc8X1dXl46OjnR0dBxwZuTIkVmxYkVWrFhxwJnx48dn1apVg10eAAAAAADAW3JEn3kCAAAAAABQ7Qa98wQ4NjwPBQAAAABgaNh5AgAAAAAAUKI8AQAAAAAAKHHbLqhCbukFAAAAAHD02HkCAAAAAABQojwBAAAAAAAocdsuqDFu6QUAAAAA8NbYeQIAAAAAAFBi5wlQcbBdKwdjRwsAAAAAUEuUJ8CQcYsxAAAAAOB4pDwB3jIlCAAAAABQS5QncAI53NtyneiUQwAAAABwYvHAeAAAAAAAgBI7T+AoO9F3exxP128HCQAAAABwKJQnQNWZ3vGdLH//v/xv7/66fueUIAAAAADAW+W2XQAAAAAAACV2ngDHpYPdYqth2LH9vMP9uoPtgnELMQAAAAA4filPAI6S4+l5LwAAAADAoXPbLgAAAAAAgBI7TwBqhFuBAQAAAMCRoTwBOM643RcAAAAADC3lCcAJwK4UAAAAADh0nnkCAAAAAABQYucJAAdkxwoAAAAAJyLlCcAJzjNWAAAAAKA/t+0CAAAAAAAosfMEgCPuzXazuOUXAAAAAMcz5QlQU9yCCgAAAAB4q9y2CwAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKPHMEwCOuYM9m8bD5AEAAAAYasoTAI4rBytWDkbpAgAAAMCR4rZdAAAAAAAAJXaeAHBYDneHCAAAAAAc75QnANQEz1EBAAAA4EhRngBQ8xQrAAAAAAyG8gSAE5piBQAAAIDXU54AwGFQugAAAADULuUJABzAwQoSAAAAAGqX8gQAjhN2swAAAAAcH5QnAHCEDWbHSsOwIsvfn0zv+E6SuqO3KAAAAAAO2UlDvQAAAAAAAIDjiZ0nAHCCcpswAAAAgDemPAGAKnA8FR3H01oAAAAAjgblCQDUsME8f+VIfB0AAABALVCeAABHzOGWLnasAAAAAMcT5QkAcFxzmzAAAADgWFOeAECVO5FvsfVWrl3xAgAAAByI8gQAGHIncgEEAAAAHH+UJwDACelo3A7MLcYAAACgNihPAABe53gqVhQyAAAAcOwpTwAAhpjblgEAAMDxRXkCAFCljqfS5Zn/1jbUSwAAAIAjRnkCADAIx1NhcTyZ3vGdLH//v/xv7/66fueOp9uSuQ0aAAAAh0J5AgDAUXW4hdOxLqqO1ucd6+fkAAAA8NYpTwAA4Cg6GiXI0Sh6FDIAAAD/v+O+PPn85z+fP/uzP8u2bdvyvve9L3fffXd+93d/d6iXBQAAb9nxdBu442ktB3M83QYOAACoXcd1efLlL385ixcvzuc///l84AMfyL333psLL7wwP/3pT3PqqacO9fIAAIBj7FjcBq5hWHHAZ/gcCUeryDmeyqPjaS0AAHA4juvy5M4778xll12WP/3TP02S3H333fnOd76Te+65J8uWLes329vbm97e3srrnp6eJMmvfvWr9PX1HbtFH8f6+vqyZ8+e/N//+38z/DevDPVy4LANf7XInj2vZnjfSdn/6pH/DxpwLMkztUKWqSVHO8/vuvH/OeLvmRz8X+6O1mceyPG0lsdvmXPE33PWsr8/rM871l9X/nfA+vr6A84dSYe7VngzQ5FnOBpkmVpSjXnevXt3kqQoijedrSsOZWoI7Nu3L6NHj87f/u3f5vd+7/cqx6+//vps2rQpa9eu7Tff0dGR22677VgvEwAAAAAAqCLPP/98TjnllIPOHLc7T375y19m//79aWpq6ne8qakp3d3dA+ZvueWWLFmypPL61Vdfza9+9atMmDAhdXX+349JsmvXrkyZMiXPP/98xo0bN9TLgcMmy9QSeaZWyDK1RJ6pFbJMLZFnaoUsU0uqMc9FUWT37t1paWl509njtjx5zeuLj6Io3rAMaWhoSENDQ79jb3vb247m0qrWuHHjqibMcDCyTC2RZ2qFLFNL5JlaIcvUEnmmVsgytaTa8tzY2HhIcycd5XUctokTJ2bYsGEDdpls3759wG4UAAAAAACAI+W4LU9GjBiRmTNnpqurq9/xrq6uzJ49e4hWBQAAAAAA1Lrj+rZdS5YsSXt7e84555y0trbmC1/4Qn7xi1/kU5/61FAvrSo1NDTks5/97IDbm0G1kWVqiTxTK2SZWiLP1ApZppbIM7VClqkltZ7nuqIoiqFexMF8/vOfz/Lly7Nt27ZMnz49d911Vz70oQ8N9bIAAAAAAIAaddyXJwAAAAAAAMfScfvMEwAAAAAAgKGgPAEAAAAAAChRngAAAAAAAJQoTwAAAAAAAEqUJyeIz3/+85k6dWpGjhyZmTNn5n//7/891EuCAX7wgx/kIx/5SFpaWlJXV5evfvWr/c4XRZGOjo60tLRk1KhROf/887Nly5Z+M729vbn22mszceLEjBkzJgsXLswLL7xwDK8CkmXLluV3fud3Mnbs2EyaNCkf+9jHsnXr1n4z8kw1uOeee3LmmWdm3LhxGTduXFpbW/Ptb3+7cl6OqVbLli1LXV1dFi9eXDkmz1SLjo6O1NXV9fvV3NxcOS/LVJt/+qd/yh/+4R9mwoQJGT16dP71v/7X2bhxY+W8TFMN3vGOdwz42VxXV5err746iRxTXX7zm9/kv/yX/5KpU6dm1KhROe200/Jf/+t/zauvvlqZOVEyrTw5AXz5y1/O4sWLc+utt+bHP/5xfvd3fzcXXnhhfvGLXwz10qCfV155JWeddVZWrlz5hueXL1+eO++8MytXrsyGDRvS3NycefPmZffu3ZWZxYsX55FHHsnq1avz2GOP5eWXX86CBQuyf//+Y3UZkLVr1+bqq6/O+vXr09XVld/85jdpa2vLK6+8UpmRZ6rBKaeckjvuuCNPPvlknnzyyXz4wx/ORz/60cpfiuWYarRhw4Z84QtfyJlnntnvuDxTTd73vvdl27ZtlV+bN2+unJNlqsmOHTvygQ98IPX19fn2t7+dn/70p/nzP//zvO1tb6vMyDTVYMOGDf1+Lnd1dSVJfv/3fz+JHFNd/vt//+/5y7/8y6xcuTJPP/10li9fnj/7sz/LihUrKjMnTKYLat773//+4lOf+lS/Y+95z3uKm2++eYhWBG8uSfHII49UXr/66qtFc3Nzcccdd1SO/frXvy4aGxuLv/zLvyyKoih27txZ1NfXF6tXr67M/NM//VNx0kknFZ2dncds7fB627dvL5IUa9euLYpCnqluJ598cvFXf/VXckxV2r17dzFt2rSiq6urOO+884rrr7++KAo/l6kun/3sZ4uzzjrrDc/JMtXm05/+dPHBD37wgOdlmmp1/fXXF+985zuLV199VY6pOhdddFHxyU9+st+xiy++uPjDP/zDoihOrJ/Ndp7UuH379mXjxo1pa2vrd7ytrS3r1q0bolXB4D377LPp7u7ul+WGhoacd955lSxv3LgxfX19/WZaWloyffp0eWdI9fT0JEnGjx+fRJ6pTvv378/q1avzyiuvpLW1VY6pSldffXUuuuiizJ07t99xeabaPPPMM2lpacnUqVPzB3/wB/nZz36WRJapPl/72tdyzjnn5Pd///czadKknH322bnvvvsq52WaarRv376sWrUqn/zkJ1NXVyfHVJ0PfvCD+fu///v8wz/8Q5Lk//yf/5PHHnss/+7f/bskJ9bP5uFDvQCOrl/+8pfZv39/mpqa+h1vampKd3f3EK0KBu+1vL5Rlp977rnKzIgRI3LyyScPmJF3hkpRFFmyZEk++MEPZvr06UnkmeqyefPmtLa25te//nV+67d+K4888kje+973Vv7CK8dUi9WrV+dHP/pRNmzYMOCcn8tUk1mzZuVv/uZv8u53vzsvvvhibr/99syePTtbtmyRZarOz372s9xzzz1ZsmRJPvOZz+SJJ57Iddddl4aGhvzRH/2RTFOVvvrVr2bnzp354z/+4yT+nkH1+fSnP52enp685z3vybBhw7J///587nOfy8c//vEkJ1amlScniLq6un6vi6IYcAyqweFkWd4ZStdcc01+8pOf5LHHHhtwTp6pBqeffno2bdqUnTt35u/+7u9y6aWXZu3atZXzckw1eP7553P99ddnzZo1GTly5AHn5JlqcOGFF1b+ecaMGWltbc073/nOPPjggzn33HOTyDLV49VXX80555yTpUuXJknOPvvsbNmyJffcc0/+6I/+qDIn01ST+++/PxdeeGFaWlr6HZdjqsWXv/zlrFq1Kg8//HDe9773ZdOmTVm8eHFaWlpy6aWXVuZOhEy7bVeNmzhxYoYNGzag0du+ffuAdhCOZ83NzUly0Cw3Nzdn37592bFjxwFn4Fi69tpr87WvfS3f+973csopp1SOyzPVZMSIEXnXu96Vc845J8uWLctZZ52Vv/iLv5BjqsrGjRuzffv2zJw5M8OHD8/w4cOzdu3a/I//8T8yfPjwSh7lmWo0ZsyYzJgxI88884yfzVSdyZMn573vfW+/Y2eccUZ+8YtfJPH3ZqrPc889l0cffTR/+qd/Wjkmx1Sb//yf/3Nuvvnm/MEf/EFmzJiR9vb2/Kf/9J+ybNmyJCdWppUnNW7EiBGZOXNmurq6+h3v6urK7Nmzh2hVMHhTp05Nc3Nzvyzv27cva9eurWR55syZqa+v7zezbdu2PPXUU/LOMVUURa655pp85StfyXe/+91MnTq133l5ppoVRZHe3l45pqrMmTMnmzdvzqZNmyq/zjnnnHziE5/Ipk2bctppp8kzVau3tzdPP/10Jk+e7GczVecDH/hAtm7d2u/YP/zDP+Ttb397En9vpvp88YtfzKRJk3LRRRdVjskx1WbPnj056aT+tcGwYcPy6quvJjnBMn1sn0/PUFi9enVRX19f3H///cVPf/rTYvHixcWYMWOKn//850O9NOhn9+7dxY9//OPixz/+cZGkuPPOO4sf//jHxXPPPVcURVHccccdRWNjY/GVr3yl2Lx5c/Hxj3+8mDx5crFr167Ke3zqU58qTjnllOLRRx8tfvSjHxUf/vCHi7POOqv4zW9+M1SXxQnoP/7H/1g0NjYW3//+94tt27ZVfu3Zs6cyI89Ug1tuuaX4wQ9+UDz77LPFT37yk+Izn/lMcdJJJxVr1qwpikKOqW7nnXdecf3111deyzPV4oYbbii+//3vFz/72c+K9evXFwsWLCjGjh1b+fc7WaaaPPHEE8Xw4cOLz33uc8UzzzxTPPTQQ8Xo0aOLVatWVWZkmmqxf//+4tRTTy0+/elPDzgnx1STSy+9tPhX/+pfFd/4xjeKZ599tvjKV75STJw4sbjpppsqMydKppUnJ4j/+T//Z/H2t7+9GDFiRPFv/s2/KdauXTvUS4IBvve97xVJBvy69NJLi6IoildffbX47Gc/WzQ3NxcNDQ3Fhz70oWLz5s393mPv3r3FNddcU4wfP74YNWpUsWDBguIXv/jFEFwNJ7I3ynGS4otf/GJlRp6pBp/85Ccrf3/47d/+7WLOnDmV4qQo5Jjq9vryRJ6pFv/hP/yHYvLkyUV9fX3R0tJSXHzxxcWWLVsq52WZavP1r3+9mD59etHQ0FC85z3vKb7whS/0Oy/TVIvvfOc7RZJi69atA87JMdVk165dxfXXX1+ceuqpxciRI4vTTjutuPXWW4ve3t7KzImS6bqiKIoh2fICAAAAAABwHPLMEwAAAAAAgBLlCQAAAAAAQInyBAAAAAAAoER5AgAAAAAAUKI8AQAAAAAAKFGeAAAAAAAAlChPAAAAAAAASpQnAAAAAAAAJcoTAAAAAACAEuUJAAAAAABAifIEAAAAAACg5P8FPeQcVkPinIkAAAAASUVORK5CYII=",
                        "text/plain": [
                            "<Figure size 2000x500 with 1 Axes>"
                        ]
                    },
                    "metadata": {},
                    "output_type": "display_data"
                }
            ],
            "source": [
                "# Plot the distribution of the number of records for each patient\n",
                "tmp_df.hist(bins=200, figsize=(20, 5))"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 19,
            "id": "7052d2af",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "count    54442.000000\n",
                            "mean        90.530197\n",
                            "std         93.926015\n",
                            "min          1.000000\n",
                            "25%         17.000000\n",
                            "50%         59.000000\n",
                            "75%        135.000000\n",
                            "max        786.000000\n",
                            "dtype: float64"
                        ]
                    },
                    "execution_count": 19,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "tmp_df.describe()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "d5241f2e",
            "metadata": {},
            "outputs": [],
            "source": []
        },
        {
            "cell_type": "code",
            "execution_count": 46,
            "metadata": {},
            "outputs": [],
            "source": [
                "ids_before = Mask_df.loc[Mask_df['Time'] < 1440].groupby('ID').size()\n",
                "ids_after = Mask_df.loc[Mask_df['Time'] > 1440].groupby('ID').size()"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 47,
            "id": "fa316b18",
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "ids_before_selected:  (31804,)\n",
                        "ids_after_selected:  (27320,)\n"
                    ]
                }
            ],
            "source": [
                "ids_before_selected = ids_before.loc[ids_before >= 20].index\n",
                "ids_after_selected = ids_after.loc[ids_after >= 20].index\n",
                "\n",
                "print(\"ids_before_selected: \", ids_before_selected.shape)\n",
                "print(\"ids_after_selected: \", ids_after_selected.shape)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "metadata": {},
            "outputs": [],
            "source": []
        },
        {
            "cell_type": "code",
            "execution_count": 48,
            "metadata": {},
            "outputs": [],
            "source": [
                "df_var_num = Mask_df.iloc[:, 1:].groupby(\"ID\").apply(lambda x: x.sum(axis=0).gt(0).sum())"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 49,
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "<AxesSubplot: >"
                        ]
                    },
                    "execution_count": 49,
                    "metadata": {},
                    "output_type": "execute_result"
                },
                {
                    "data": {
                        "image/png": "iVBORw0KGgoAAAANSUhEUgAAAjEAAAGdCAYAAADjWSL8AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjYuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8o6BhiAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAoe0lEQVR4nO3df3BT9Z7/8VdoS6DcNpfCbdMOFbtuYd0t19ktCsV7BS80hbFyudxZ7m53OsiyiCPi7RTGAR2/Bu+9heUPcLesiC4DCnbKH3urzuAWwtxrka0odLdzgWVQZ0FBKfVyS8qvm8b27B9+e9Y0KU1K2uRTno+ZDJ5P3p+TT/Jum5cnOYnDsixLAAAAhhmV6AUAAAAMBiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGCk1EQvYKj09PToyy+/VEZGhhwOR6KXAwAAomBZlq5evaq8vDyNGnXrYy0jNsR8+eWXys/PT/QyAADAIJw/f16TJk26Zc2IDTEZGRmSvnkQMjMzo5oTDAZ18OBBeTwepaWlDeXycAv0ITnQh+RAH5IDfRg+nZ2dys/Pt5/Hb2XEhpjel5AyMzNjCjHp6enKzMzkhzSB6ENyoA/JgT4kB/ow/KJ5Kwhv7AUAAEYixAAAACMRYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGQERF3gP2v3ev25/g1QBAuNRELwDA8OsbSs5temRE3BaAOwtHYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGImzkwCDRTr1mbN/ANwpCDEAEo7TsAEMBi8nAQAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEmcnARg0zioCkEgciQEAAEYixAAAACPxchIAI/FpxQA4EgMAAIwUU4jZuHGj7r//fmVkZCg7O1uLFi3SmTNnQmoee+wxORyOkMvMmTNDagKBgFavXq2JEydq3LhxWrhwoS5cuBBS09HRocrKSrlcLrlcLlVWVurKlSuDu5cAAGDEiSnENDU1adWqVTp69Kh8Pp++/vpreTweXb9+PaRu/vz5unjxon159913Q66vqqpSQ0OD6uvrdeTIEV27dk3l5eXq7u62ayoqKtTa2qrGxkY1NjaqtbVVlZWVt3FXAQDASBLTe2IaGxtDtnft2qXs7Gy1tLTooYcessedTqfcbnfEffj9fu3cuVN79uzRvHnzJEl79+5Vfn6+Dh06pLKyMp0+fVqNjY06evSoZsyYIUl67bXXVFJSojNnzmjq1Kkx3UkAADDy3NZ7Yvx+vyQpKysrZPy9995Tdna2pkyZohUrVqi9vd2+rqWlRcFgUB6Pxx7Ly8tTUVGRmpubJUkffPCBXC6XHWAkaebMmXK5XHYNAAC4sw367CTLslRdXa0f/OAHKioqsscXLFigv/7rv9bkyZN19uxZPf/88/rRj36klpYWOZ1OtbW1afTo0Ro/fnzI/nJyctTW1iZJamtrU3Z2dthtZmdn2zV9BQIBBQIBe7uzs1OSFAwGFQwGo7pPvXXR1mNo0IfoOVOssLFoHre+8yLNcY6yQv6NWBPNfuJUM9CcaOeZht+H5EAfhk8sj7HDsqzwvwRRWLVqlfbv368jR45o0qRJ/dZdvHhRkydPVn19vRYvXqy6ujotW7YsJHBIUmlpqe655x698sorqqmp0euvvx72puHCwkItX75c69atC7sdr9erDRs2hI3X1dUpPT19MHcRAAAMsxs3bqiiokJ+v1+ZmZm3rB3UkZjVq1frnXfe0eHDh28ZYCQpNzdXkydP1ieffCJJcrvd6urqUkdHR8jRmPb2ds2aNcuuuXTpUti+vvrqK+Xk5ES8nfXr16u6utre7uzsVH5+vjwez4APQq9gMCifz6fS0lKlpaVFNQfxRx+iV+Q9EDZ20lsW87xIc4pfbNQvpvfo+eOjFOhxRKyJZj/xqhloTrTzTMPvQ3KgD8On95WUaMQUYizL0urVq9XQ0KD33ntPBQUFA865fPmyzp8/r9zcXElScXGx0tLS5PP5tGTJEknfHK05efKkNm/eLEkqKSmR3+/XRx99pAceeECS9OGHH8rv99tBpy+n0ymn0xk2npaWFvMP3GDmIP7u9D5E82FugW5HWE00j1nfeZHmBHoc9r+Bbkfkmmj2E6eageZEO89Ud/rvQ7KgD0Mvlsc3phCzatUq1dXV6e2331ZGRob9/hSXy6WxY8fq2rVr8nq9+ulPf6rc3FydO3dOzz77rCZOnKif/OQndu3y5cu1Zs0aTZgwQVlZWVq7dq2mTZtmn6107733av78+VqxYoV27NghSXr88cdVXl7OmUkAAEBSjCFm+/btkqQ5c+aEjO/atUuPPfaYUlJSdOLECb3xxhu6cuWKcnNz9fDDD2vfvn3KyMiw67du3arU1FQtWbJEN2/e1Ny5c7V7926lpKTYNW+++aaefvpp+yymhQsXatu2bYO9nwAAYISJ+eWkWxk7dqwOHAh/nbqvMWPGqLa2VrW1tf3WZGVlae/evbEsDwBC8P1KwMjGdycBAAAjEWIAAICRCDEAAMBIhBgAAGCkQX/tAIDB4w2nAHD7OBIDAACMxJEYABgAR86A5MSRGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARuLsJAB3tHidecQZTMDw40gMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEYixAAAACMRYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASKmJXgAA3CnuXrc/bOzcpkcSsBJgZCDEAHHGExUADA9eTgIAAEYixAAAACMRYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGiinEbNy4Uffff78yMjKUnZ2tRYsW6cyZMyE1lmXJ6/UqLy9PY8eO1Zw5c3Tq1KmQmkAgoNWrV2vixIkaN26cFi5cqAsXLoTUdHR0qLKyUi6XSy6XS5WVlbpy5crg7iUAGK7Ie0B3r9uvu9ftT/RSgKQRU4hpamrSqlWrdPToUfl8Pn399dfyeDy6fv26XbN582Zt2bJF27Zt07Fjx+R2u1VaWqqrV6/aNVVVVWpoaFB9fb2OHDmia9euqby8XN3d3XZNRUWFWltb1djYqMbGRrW2tqqysjIOdxkAAIwEqbEUNzY2hmzv2rVL2dnZamlp0UMPPSTLsvTSSy/pueee0+LFiyVJr7/+unJyclRXV6eVK1fK7/dr586d2rNnj+bNmydJ2rt3r/Lz83Xo0CGVlZXp9OnTamxs1NGjRzVjxgxJ0muvvaaSkhKdOXNGU6dOjcd9BwAABospxPTl9/slSVlZWZKks2fPqq2tTR6Px65xOp2aPXu2mpubtXLlSrW0tCgYDIbU5OXlqaioSM3NzSorK9MHH3wgl8tlBxhJmjlzplwul5qbmyOGmEAgoEAgYG93dnZKkoLBoILBYFT3p7cu2noMDdP74Eyxwsb63pfhrIlmjZHmOEdZIf9GrIlmP3GqGWhOpHkm1vR3fW8fopmD+DP975JJYnmMHZZlhf9WRcGyLP34xz9WR0eH3n//fUlSc3OzHnzwQX3xxRfKy8uzax9//HF99tlnOnDggOrq6rRs2bKQwCFJHo9HBQUF2rFjh2pqarR79259/PHHITVTpkzRsmXLtH79+rD1eL1ebdiwIWy8rq5O6enpg7mLAABgmN24cUMVFRXy+/3KzMy8Ze2gj8Q89dRT+t3vfqcjR46EXedwOEK2LcsKG+urb02k+lvtZ/369aqurra3Ozs7lZ+fL4/HM+CD0CsYDMrn86m0tFRpaWlRzUH8md6HIu+BsLGT3rKE1USzxkhzil9s1C+m9+j546MU6HFErIlmP/GqGWhOpHkm1vTV+/vQ24do5iD+TP+7ZJLeV1KiMagQs3r1ar3zzjs6fPiwJk2aZI+73W5JUltbm3Jzc+3x9vZ25eTk2DVdXV3q6OjQ+PHjQ2pmzZpl11y6dCnsdr/66it7P305nU45nc6w8bS0tJh/4AYzB/Fnah8C3eFBu+/9GM6aaNYYaU7vE2agx6FAtyNyTTT7iVPNQHMizTOxpj+9fYhlDuLP1L9LJonl8Y3p7CTLsvTUU0/p17/+tX7zm9+ooKAg5PqCggK53W75fD57rKurS01NTXZAKS4uVlpaWkjNxYsXdfLkSbumpKREfr9fH330kV3z4Ycfyu/32zUAAODOFtORmFWrVqmurk5vv/22MjIy1NbWJklyuVwaO3asHA6HqqqqVFNTo8LCQhUWFqqmpkbp6emqqKiwa5cvX641a9ZowoQJysrK0tq1azVt2jT7bKV7771X8+fP14oVK7Rjxw5J37yvpry8nDOTAACApBhDzPbt2yVJc+bMCRnftWuXHnvsMUnSM888o5s3b+rJJ59UR0eHZsyYoYMHDyojI8Ou37p1q1JTU7VkyRLdvHlTc+fO1e7du5WSkmLXvPnmm3r66afts5gWLlyobdu2DeY+AgCAESimEBPNiUwOh0Ner1der7ffmjFjxqi2tla1tbX91mRlZWnv3r2xLA8AANxB+O4kAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEYixAAAACMRYgAAgJFSE70AwCR3r9sfNnZu0yMJWAkAgCMxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkvnYAAEaAvl+Jwddh4E7AkRgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEYixAAAACMRYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRUhO9AADA8Lh73f6Q7XObHknQSoD44EgMAAAwEiEGAAAYiRADAACMRIgBAABGijnEHD58WI8++qjy8vLkcDj01ltvhVz/2GOPyeFwhFxmzpwZUhMIBLR69WpNnDhR48aN08KFC3XhwoWQmo6ODlVWVsrlcsnlcqmyslJXrlyJ+Q4CAICRKeYQc/36dd13333atm1bvzXz58/XxYsX7cu7774bcn1VVZUaGhpUX1+vI0eO6Nq1ayovL1d3d7ddU1FRodbWVjU2NqqxsVGtra2qrKyMdbkAAGCEivkU6wULFmjBggW3rHE6nXK73RGv8/v92rlzp/bs2aN58+ZJkvbu3av8/HwdOnRIZWVlOn36tBobG3X06FHNmDFDkvTaa6+ppKREZ86c0dSpU2NdNgAAGGGG5HNi3nvvPWVnZ+u73/2uZs+erV/96lfKzs6WJLW0tCgYDMrj8dj1eXl5KioqUnNzs8rKyvTBBx/I5XLZAUaSZs6cKZfLpebm5oghJhAIKBAI2NudnZ2SpGAwqGAwGNW6e+uircfQSOY+OFOssLG+60y2mkj6zos0xznKCvk3Yk00+4lTzUBzIs0zsaa/63v70N+coXqc8Y1k/rs00sTyGDssywr/rYp2ssOhhoYGLVq0yB7bt2+fvvOd72jy5Mk6e/asnn/+eX399ddqaWmR0+lUXV2dli1bFhI4JMnj8aigoEA7duxQTU2Ndu/erY8//jikZsqUKVq2bJnWr18fthav16sNGzaEjdfV1Sk9PX2wdxEAAAyjGzduqKKiQn6/X5mZmbesjfuRmJ/97Gf2fxcVFWn69OmaPHmy9u/fr8WLF/c7z7IsORwOe/vb/91fzbetX79e1dXV9nZnZ6fy8/Pl8XgGfBB6BYNB+Xw+lZaWKi0tLao5iL9k7kOR90DY2ElvWVLXRNJ3XqQ5xS826hfTe/T88VEK9Dgi1kSzn3jVDDQn0jwTa/rq/X3o7UN/c4bqccY3kvnv0kjT+0pKNIb8awdyc3M1efJkffLJJ5Ikt9utrq4udXR0aPz48XZde3u7Zs2aZddcunQpbF9fffWVcnJyIt6O0+mU0+kMG09LS4v5B24wcxB/ydiHQHd4iO67xmSriaTvvEhzep8wAz0OBbodkWui2U+cagaaE2meiTX96e1Df3OG6nFGqGT8uzTSxPL4DvnnxFy+fFnnz59Xbm6uJKm4uFhpaWny+Xx2zcWLF3Xy5Ek7xJSUlMjv9+ujjz6yaz788EP5/X67BgAA3NliPhJz7do1ffrpp/b22bNn1draqqysLGVlZcnr9eqnP/2pcnNzde7cOT377LOaOHGifvKTn0iSXC6Xli9frjVr1mjChAnKysrS2rVrNW3aNPtspXvvvVfz58/XihUrtGPHDknS448/rvLycs5MAgAAkgYRYo4fP66HH37Y3u59H8rSpUu1fft2nThxQm+88YauXLmi3NxcPfzww9q3b58yMjLsOVu3blVqaqqWLFmimzdvau7cudq9e7dSUlLsmjfffFNPP/20fRbTwoULb/nZNMDt6vsNvxLf8gsAySzmEDNnzhzd6oSmAwfC37jW15gxY1RbW6va2tp+a7KysrR3795YlwcAAO4QfHcSAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEYixAAAACMRYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASKmJXgAAIHncvW5/yPa5TY8kaCXAwDgSAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEZKTfQCgHi7e93+sLFzmx5JwEoAAEOJIzEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIzE2UkAgJj0PQOQs/+QKByJAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwUswh5vDhw3r00UeVl5cnh8Oht956K+R6y7Lk9XqVl5ensWPHas6cOTp16lRITSAQ0OrVqzVx4kSNGzdOCxcu1IULF0JqOjo6VFlZKZfLJZfLpcrKSl25ciXmOwgAAEammEPM9evXdd9992nbtm0Rr9+8ebO2bNmibdu26dixY3K73SotLdXVq1ftmqqqKjU0NKi+vl5HjhzRtWvXVF5eru7ubrumoqJCra2tamxsVGNjo1pbW1VZWTmIuwgAAEaimD/sbsGCBVqwYEHE6yzL0ksvvaTnnntOixcvliS9/vrrysnJUV1dnVauXCm/36+dO3dqz549mjdvniRp7969ys/P16FDh1RWVqbTp0+rsbFRR48e1YwZMyRJr732mkpKSnTmzBlNnTp1sPcXAACMEHH9xN6zZ8+qra1NHo/HHnM6nZo9e7aam5u1cuVKtbS0KBgMhtTk5eWpqKhIzc3NKisr0wcffCCXy2UHGEmaOXOmXC6XmpubI4aYQCCgQCBgb3d2dkqSgsGggsFgVOvvrYu2HkPjdvvgTLH63eftzjOxJpK+8yLNcY6yQv6NWBPNfuJUM9CcSPNMrOnv+t4+9DdnOHsxmH6ZjueH4RPLY+ywLCv8tyrayQ6HGhoatGjRIklSc3OzHnzwQX3xxRfKy8uz6x5//HF99tlnOnDggOrq6rRs2bKQwCFJHo9HBQUF2rFjh2pqarR79259/PHHITVTpkzRsmXLtH79+rC1eL1ebdiwIWy8rq5O6enpg72LAABgGN24cUMVFRXy+/3KzMy8Ze2QfHeSw+EI2bYsK2ysr741kepvtZ/169erurra3u7s7FR+fr48Hs+AD0KvYDAon8+n0tJSpaWlRTUH8Xe7fSjyHggbO+kti8s8E2si6Tsv0pziFxv1i+k9ev74KAV6HBFrotlPvGoGmhNpnok1ffX+PvT2ob85w9mLwfTLdDw/DJ/eV1KiEdcQ43a7JUltbW3Kzc21x9vb25WTk2PXdHV1qaOjQ+PHjw+pmTVrll1z6dKlsP1/9dVX9n76cjqdcjqdYeNpaWkx/8ANZg7ib7B9CHSHB91o9hPNPBNrIuk7L9Kc3ifMQI9DgW5H5Jpo9hOnmoHmRJpnYk1/evvQ35zh7MVg+jVS8Pww9GJ5fOP6OTEFBQVyu93y+Xz2WFdXl5qamuyAUlxcrLS0tJCaixcv6uTJk3ZNSUmJ/H6/PvroI7vmww8/lN/vt2sAAMCdLeYjMdeuXdOnn35qb589e1atra3KysrSXXfdpaqqKtXU1KiwsFCFhYWqqalRenq6KioqJEkul0vLly/XmjVrNGHCBGVlZWnt2rWaNm2afbbSvffeq/nz52vFihXasWOHpG/eV1NeXs6ZSQAAQNIgQszx48f18MMP29u970NZunSpdu/erWeeeUY3b97Uk08+qY6ODs2YMUMHDx5URkaGPWfr1q1KTU3VkiVLdPPmTc2dO1e7d+9WSkqKXfPmm2/q6aefts9iWrhwYb+fTQMAAO48MYeYOXPm6FYnNDkcDnm9Xnm93n5rxowZo9raWtXW1vZbk5WVpb1798a6PAAAcIfgu5MAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEYixAAAACMRYgAAgJEIMQAAwEgxf+0AkEh3r9sfNnZu0yMJWAkAINE4EgMAAIxEiAEAAEYixAAAACPxnhgAQNz1ff8a713DUOBIDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIxEiAEAAEYixAAAACMRYgAAgJEIMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARkpN9AIAAJCku9ftDxs7t+mRBKwEpuBIDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJD7sDkmj94OunCmWNj8gFXkP6MyvyhO8KgBAsuJIDAAAMFLcQ4zX65XD4Qi5uN1u+3rLsuT1epWXl6exY8dqzpw5OnXqVMg+AoGAVq9erYkTJ2rcuHFauHChLly4EO+lAgAAgw3JkZi/+Iu/0MWLF+3LiRMn7Os2b96sLVu2aNu2bTp27JjcbrdKS0t19epVu6aqqkoNDQ2qr6/XkSNHdO3aNZWXl6u7u3solgsAAAw0JO+JSU1NDTn60suyLL300kt67rnntHjxYknS66+/rpycHNXV1WnlypXy+/3auXOn9uzZo3nz5kmS9u7dq/z8fB06dEhlZWVDsWQAAGCYITkS88knnygvL08FBQX6m7/5G/3P//yPJOns2bNqa2uTx+Oxa51Op2bPnq3m5mZJUktLi4LBYEhNXl6eioqK7BoAAIC4H4mZMWOG3njjDU2ZMkWXLl3SL3/5S82aNUunTp1SW1ubJCknJydkTk5Ojj777DNJUltbm0aPHq3x48eH1fTOjyQQCCgQCNjbnZ2dkqRgMKhgMBjV2nvroq1HfDlTrG/+HfV///btRW/Ntw2m5la3f7v7TraaSPrOizTn233otyaa/cSpZqA5keaZWNPf9b196G/OcPYikT1NFJ4fhk8sj7HDsqzwn5o4un79uu655x4988wzmjlzph588EF9+eWXys3NtWtWrFih8+fPq7GxUXV1dVq2bFlIIJGk0tJS3XPPPXrllVci3o7X69WGDRvCxuvq6pSenh7fOwUAAIbEjRs3VFFRIb/fr8zMzFvWDvnnxIwbN07Tpk3TJ598okWLFkn65mjLt0NMe3u7fXTG7Xarq6tLHR0dIUdj2tvbNWvWrH5vZ/369aqurra3Ozs7lZ+fL4/HM+CD0CsYDMrn86m0tFRpaWmx3E3EQZH3gKRv/o/zF9N79PzxUWr5f/Mj1nzbSW9ZzDW3uv3b3Xey1UTSd16kOcUvNtp9CPQ4ItZEs5941Qw0J9I8E2v66v271NuH/uYMZy8S2dNE4flh+PS+khKNIQ8xgUBAp0+f1g9/+EMVFBTI7XbL5/PpL//yLyVJXV1dampq0j/+4z9KkoqLi5WWliafz6clS5ZIki5evKiTJ09q8+bN/d6O0+mU0+kMG09LS4v5B24wc3D7At2O0O0eR1gf+tZIGlRNNLc/2H0nW00kfedFmtP7hBnocSjQHd6LqPcTp5qB5kSaZ2JNf3r70N+c4exFInuaaDw/DL1YHt+4h5i1a9fq0Ucf1V133aX29nb98pe/VGdnp5YuXSqHw6GqqirV1NSosLBQhYWFqqmpUXp6uioqKiRJLpdLy5cv15o1azRhwgRlZWVp7dq1mjZtmn22EgDgztT7yd7fdm7TIwlYCZJB3EPMhQsX9Ld/+7f6/e9/r+9973uaOXOmjh49qsmTJ0uSnnnmGd28eVNPPvmkOjo6NGPGDB08eFAZGRn2PrZu3arU1FQtWbJEN2/e1Ny5c7V7926lpKTEe7kAAMBQcQ8x9fX1t7ze4XDI6/XK6/X2WzNmzBjV1taqtrY2zqsDAAAjBd+dBAAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGGvJvsQYkvrQNABB/HIkBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADASIQYAABiJz4kBAIwofC7VnYMjMQAAwEiEGAAAYCRCDAAAMBIhBgAAGIkQAwAAjESIAQAARiLEAAAAIxFiAACAkQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMxLdYAwDuSH2/7ZpvujYPR2IAAICRCDEAAMBIhBgAAGAk3hOD29b3dWWJ15YBAEOPIzEAAMBIhBgAAGAkQgwAADASIQYAABiJEAMAAIzE2UkAAPSj9+xLZ4qlzQ8keDEIw5EYAABgJEIMAAAwEiEGAAAYiRADAACMxBt7cUt8pQAAIFlxJAYAABiJEAMAAIzEy0kAANyGvi+785L78OFIDAAAMBJHYkYI/k8AAHCnIcTcQQg6AICRhBAzhOIVGggfADCy8PEV8ZH074l5+eWXVVBQoDFjxqi4uFjvv/9+opcUV3ev2x9yAQAA0UnqIzH79u1TVVWVXn75ZT344IPasWOHFixYoP/+7//WXXfdlejlAQAwZDhaM7CkDjFbtmzR8uXL9Q//8A+SpJdeekkHDhzQ9u3btXHjxoSujZd4AACJdqcHnaQNMV1dXWppadG6detCxj0ej5qbm8PqA4GAAoGAve33+yVJf/jDHxQMBqO6zWAwqBs3bujy5ctKS0u7ZW3q19dDti9fvjwiagaaE2levGtSeyzduNGj1OCoIbutSBJxX4ejJpKofl6C1+0+dPc4+Nkcppq+ev8u9fahvznJ9rck2Xsa7Rr7/l2K9Pxgwn01ydWrVyVJlmUNXGwlqS+++MKSZP3Hf/xHyPivfvUra8qUKWH1L7zwgiWJCxcuXLhw4TICLufPnx8wKyTtkZheDocjZNuyrLAxSVq/fr2qq6vt7Z6eHv3hD3/QhAkTItZH0tnZqfz8fJ0/f16ZmZm3t3AMGn1IDvQhOdCH5EAfho9lWbp69ary8vIGrE3aEDNx4kSlpKSora0tZLy9vV05OTlh9U6nU06nM2Tsu9/97qBuOzMzkx/SJEAfkgN9SA70ITnQh+HhcrmiqkvaU6xHjx6t4uJi+Xy+kHGfz6dZs2YlaFUAACBZJO2RGEmqrq5WZWWlpk+frpKSEr366qv6/PPP9cQTTyR6aQAAIMGSOsT87Gc/0+XLl/Xiiy/q4sWLKioq0rvvvqvJkycPye05nU698MILYS9LYXjRh+RAH5IDfUgO9CE5OSwrmnOYAAAAkkvSvicGAADgVggxAADASIQYAABgJEIMAAAwEiHm/3v55ZdVUFCgMWPGqLi4WO+//36ilzTiHT58WI8++qjy8vLkcDj01ltvhVxvWZa8Xq/y8vI0duxYzZkzR6dOnUrMYkeojRs36v7771dGRoays7O1aNEinTlzJqSGPgy97du36/vf/779QWolJSX693//d/t6epAYGzdulMPhUFVVlT1GL5ILIUbSvn37VFVVpeeee07/9V//pR/+8IdasGCBPv/880QvbUS7fv267rvvPm3bti3i9Zs3b9aWLVu0bds2HTt2TG63W6WlpfaXg+H2NTU1adWqVTp69Kh8Pp++/vpreTweXb/+f18qRx+G3qRJk7Rp0yYdP35cx48f149+9CP9+Mc/tp8c6cHwO3bsmF599VV9//vfDxmnF0nmtr+pcQR44IEHrCeeeCJk7M/+7M+sdevWJWhFdx5JVkNDg73d09Njud1ua9OmTfbYH//4R8vlclmvvPJKAlZ4Z2hvb7ckWU1NTZZl0YdEGj9+vPWv//qv9CABrl69ahUWFlo+n8+aPXu29fOf/9yyLH4fktEdfySmq6tLLS0t8ng8IeMej0fNzc0JWhXOnj2rtra2kL44nU7Nnj2bvgwhv98vScrKypJEHxKhu7tb9fX1un79ukpKSuhBAqxatUqPPPKI5s2bFzJOL5JPUn9i73D4/e9/r+7u7rAvlczJyQn78kkMn97HPlJfPvvss0QsacSzLEvV1dX6wQ9+oKKiIkn0YTidOHFCJSUl+uMf/6jvfOc7amho0J//+Z/bT470YHjU19frP//zP3Xs2LGw6/h9SD53fIjp5XA4QrYtywobw/CjL8Pnqaee0u9+9zsdOXIk7Dr6MPSmTp2q1tZWXblyRf/2b/+mpUuXqqmpyb6eHgy98+fP6+c//7kOHjyoMWPG9FtHL5LHHf9y0sSJE5WSkhJ21KW9vT0sbWP4uN1uSaIvw2T16tV655139Nvf/laTJk2yx+nD8Bk9erT+9E//VNOnT9fGjRt133336Z/+6Z/owTBqaWlRe3u7iouLlZqaqtTUVDU1Nemf//mflZqaaj/e9CJ53PEhZvTo0SouLpbP5wsZ9/l8mjVrVoJWhYKCArnd7pC+dHV1qampib7EkWVZeuqpp/TrX/9av/nNb1RQUBByPX1IHMuyFAgE6MEwmjt3rk6cOKHW1lb7Mn36dP3d3/2dWltb9Sd/8if0IsnwcpKk6upqVVZWavr06SopKdGrr76qzz//XE888USilzaiXbt2TZ9++qm9ffbsWbW2tiorK0t33XWXqqqqVFNTo8LCQhUWFqqmpkbp6emqqKhI4KpHllWrVqmurk5vv/22MjIy7P/DdLlcGjt2rP0ZGfRhaD377LNasGCB8vPzdfXqVdXX1+u9995TY2MjPRhGGRkZ9vvBeo0bN04TJkywx+lFkknciVHJ5V/+5V+syZMnW6NHj7b+6q/+yj7FFEPnt7/9rSUp7LJ06VLLsr45nfGFF16w3G635XQ6rYceesg6ceJEYhc9wkR6/CVZu3btsmvow9D7+7//e/vvz/e+9z1r7ty51sGDB+3r6UHifPsUa8uiF8nGYVmWlaD8BAAAMGh3/HtiAACAmQgxAADASIQYAABgJEIMAAAwEiEGAAAYiRADAACMRIgBAABGIsQAAAAjEWIAAICRCDEAAMBIhBgAAGAkQgwAADDS/wI9witl6xdjkwAAAABJRU5ErkJggg==",
                        "text/plain": [
                            "<Figure size 640x480 with 1 Axes>"
                        ]
                    },
                    "metadata": {},
                    "output_type": "display_data"
                }
            ],
            "source": [
                "df_var_num.hist(bins=100)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 50,
            "id": "f2f8baff",
            "metadata": {},
            "outputs": [
                {
                    "name": "stdout",
                    "output_type": "stream",
                    "text": [
                        "ids_selected_by_vars:  (53560,)\n"
                    ]
                }
            ],
            "source": [
                "ids_selected_by_vars = df_var_num.loc[df_var_num >= 10].index\n",
                "\n",
                "print(\"ids_selected_by_vars: \", ids_selected_by_vars.shape)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 51,
            "id": "33139d2e",
            "metadata": {},
            "outputs": [
                {
                    "data": {
                        "text/plain": [
                            "22591"
                        ]
                    },
                    "execution_count": 51,
                    "metadata": {},
                    "output_type": "execute_result"
                }
            ],
            "source": [
                "ids_selected = set(ids_before_selected) & set(ids_after_selected) & set(ids_selected_by_vars)\n",
                "len(ids_selected)"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 52,
            "id": "92e6f7e2",
            "metadata": {},
            "outputs": [],
            "source": [
                "complete_df = complete_df.loc[list(ids_selected)]"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": 53,
            "id": "b79f6639",
            "metadata": {},
            "outputs": [],
            "source": [
                "complete_df.to_csv(\n",
                "    path_m4/'processed/mimic4_full_dataset.csv')"
            ]
        },
        {
            "cell_type": "code",
            "execution_count": null,
            "id": "94f80aae",
            "metadata": {},
            "outputs": [],
            "source": []
        }
    ],
    "metadata": {
        "kernelspec": {
            "display_name": "Python 3.8.12 ('transfer_ehr')",
            "language": "python",
            "name": "python3"
        },
        "language_info": {
            "codemirror_mode": {
                "name": "ipython",
                "version": 3
            },
            "file_extension": ".py",
            "mimetype": "text/x-python",
            "name": "python",
            "nbconvert_exporter": "python",
            "pygments_lexer": "ipython3",
            "version": "3.10.8"
        },
        "vscode": {
            "interpreter": {
                "hash": "5ae865abb88ad0a991db65fb0a3113ce9d7dd5f50b65ef8b203d3356ff36831c"
            }
        }
    },
    "nbformat": 4,
    "nbformat_minor": 5
}
