{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/hjlee/.conda/envs/hydra/lib/python3.9/site-packages/tqdm/auto.py:22: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
      "  from .autonotebook import tqdm as notebook_tqdm\n"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import torch\n",
    "from torch.utils.data import Dataset\n",
    "\n",
    "from sklearn.preprocessing import LabelEncoder\n",
    "from sklearn.utils import shuffle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "def getBinary(df, cols):\n",
    "    labels = df[cols].apply(lambda s: np.median(s)).values\n",
    "    x = df[cols].values\n",
    "    xs = np.zeros_like(x)\n",
    "    for j in range(len(labels)):\n",
    "        if x[:,j].max() == labels[j]:\n",
    "            xs[:,j] = x[:,j]\n",
    "        else:\n",
    "            xs[:,j] = (x[:,j] > labels[j]).astype(int)\n",
    "    df = pd.DataFrame(xs, columns=cols)\n",
    "    return df.astype('category')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Data Sources\n",
    "\n",
    "- **Adult.data, Adult.test:** https://archive.ics.uci.edu/ml/datasets/adult\n",
    "- **Health.csv:** https://github.com/SoftWiser-group/FairDisCo"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Adult"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "cols = ['age', 'workclass', 'fnlwgt', 'education', 'education-num', 'marital-status', 'occupation', \\\n",
    "        'relationship', 'race', 'sex', 'capital-gain', 'capital-loss','hours-per-week', 'native-country', 'salary']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "train_size 32561, test_size 16281\n"
     ]
    }
   ],
   "source": [
    "df_train = pd.read_csv(\"/home/hjlee/FairDisCo/data/Adult/adult.data\", names=cols)\n",
    "df_test = pd.read_csv(\"/home/hjlee/FairDisCo/data/Adult/adult.test\", names=cols, skiprows=1)\n",
    "\n",
    "num_train = df_train.shape[0]\n",
    "num_test = df_test.shape[0]\n",
    "df = pd.concat([df_train, df_test], ignore_index=True)\n",
    "df = df.apply(lambda v: v.astype(str).str.strip() if v.dtype == \"object\" else v)\n",
    "print('train_size {}, test_size {}'.format(num_train, num_test))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Remove missing values(' ?')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "train_size 30162, test_size 15060\n"
     ]
    }
   ],
   "source": [
    "df_train = pd.read_csv('/home/hjlee/FairDisCo/data/Adult/adult.data', names=cols)\n",
    "df_test = pd.read_csv('/home/hjlee/FairDisCo/data/Adult/adult.test', names=cols, skiprows=1)\n",
    "\n",
    "# Filtering ? value\n",
    "for j in range(df_train.shape[1]):\n",
    "    df_train = df_train[df_train.iloc[:, j] != ' ?']\n",
    "    df_test = df_test[df_test.iloc[:, j] != ' ?']\n",
    "\n",
    "num_train = df_train.shape[0]\n",
    "num_test = df_test.shape[0]\n",
    "df = pd.concat([df_train, df_test], ignore_index=True)\n",
    "df = df.apply(lambda v: v.astype(str).str.strip() if v.dtype == \"object\" else v)\n",
    "print('train_size {}, test_size {}'.format(num_train, num_test))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Discretize the continuous variables"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "df['age'] = pd.cut(df['age'], bins=5)\n",
    "df['hours-per-week'] = pd.cut(df['hours-per-week'], bins=5)\n",
    "df['fnlwgt'] = pd.cut(np.log(df['fnlwgt']), bins=5)\n",
    "df[['capital-gain', 'capital-loss']] = getBinary(df, ['capital-gain', 'capital-loss'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "S = (df['sex'] == 'Male').values.astype(int)\n",
    "Y = (df['salary'].apply(lambda x: x == '<=50K' or x == '<=50K.')).values.astype(int)\n",
    "del df['salary']\n",
    "del df['sex']\n",
    "del df['education-num']\n",
    "# dset_adult = getDataset(df, S, Y, num_train)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = pd.get_dummies(df)\n",
    "data['label'] = Y\n",
    "data['sex'] = S"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "data structure: X(115), Y(1), S(1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.save('../data/adult_train', data.iloc[:num_train, :])\n",
    "np.save('../data/adult_test', data.iloc[num_train:, :])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# import pickle\n",
    "# with open('adult_train.pkl', 'wb') as f:\n",
    "#     pickle.dump(data.iloc[:num_train, :], f)\n",
    "\n",
    "# with open('adult_test.pkl', 'wb') as f:\n",
    "#     pickle.dump(data.iloc[num_train:, :], f)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "----------------------"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Health"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "train_size 44116, test_size 11030\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(2022)\n",
    "df = pd.read_csv('../FairDisCo/data/Health.csv')\n",
    "df = df[df['YEAR_t'].isin(['Y2'])]\n",
    "df = df[(df['sexMISS'] == 0)&(df['age_MISS'] == 0)]\n",
    "df = shuffle(df).reset_index(drop=True)\n",
    "\n",
    "num_train = int(df.shape[0]*0.8)\n",
    "print('train_size {}, test_size {}'.format(num_train, df.shape[0]-num_train))\n",
    "\n",
    "age = df[['age_%d5' % (i) for i in range(0, 9)]].values.argmax(axis=1)\n",
    "sex = df[['sexMALE', 'sexFEMALE']].values.argmax(axis=1)\n",
    "\n",
    "Y = (df['DaysInHospital'] > 0).values.astype(int)\n",
    "drop_cols = ['age_%d5' % (i) for i in range(0, 9)] + ['sexMALE', 'sexFEMALE',  'sexMISS', 'age_MISS', 'trainset', 'DaysInHospital', 'MemberID_t', 'YEAR_t']\n",
    "\n",
    "df = df.drop(drop_cols, axis=1)\n",
    "df = getBinary(df, df.columns)\n",
    "\n",
    "df['sex'] = sex\n",
    "S = (age > 6).astype(int)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>ClaimsTruncated_0.0</th>\n",
       "      <th>ClaimsTruncated_1.0</th>\n",
       "      <th>no_Claims_0.0</th>\n",
       "      <th>no_Claims_1.0</th>\n",
       "      <th>no_Providers_0.0</th>\n",
       "      <th>no_Providers_1.0</th>\n",
       "      <th>no_Vendors_0.0</th>\n",
       "      <th>no_Vendors_1.0</th>\n",
       "      <th>no_PCPs_0.0</th>\n",
       "      <th>no_PCPs_1.0</th>\n",
       "      <th>...</th>\n",
       "      <th>labCount_ave_0.0</th>\n",
       "      <th>labCount_ave_1.0</th>\n",
       "      <th>labcount_months_0.0</th>\n",
       "      <th>labcount_months_1.0</th>\n",
       "      <th>labNull_0.0</th>\n",
       "      <th>labNull_1.0</th>\n",
       "      <th>drugNull_0.0</th>\n",
       "      <th>drugNull_1.0</th>\n",
       "      <th>sex_0</th>\n",
       "      <th>sex_1</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55141</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55142</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55143</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55144</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55145</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>55146 rows × 254 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       ClaimsTruncated_0.0  ClaimsTruncated_1.0  no_Claims_0.0  no_Claims_1.0  \\\n",
       "0                        1                    0              0              1   \n",
       "1                        0                    1              0              1   \n",
       "2                        1                    0              0              1   \n",
       "3                        1                    0              0              1   \n",
       "4                        1                    0              0              1   \n",
       "...                    ...                  ...            ...            ...   \n",
       "55141                    1                    0              0              1   \n",
       "55142                    1                    0              1              0   \n",
       "55143                    0                    1              0              1   \n",
       "55144                    1                    0              1              0   \n",
       "55145                    1                    0              1              0   \n",
       "\n",
       "       no_Providers_0.0  no_Providers_1.0  no_Vendors_0.0  no_Vendors_1.0  \\\n",
       "0                     1                 0               1               0   \n",
       "1                     0                 1               0               1   \n",
       "2                     0                 1               0               1   \n",
       "3                     0                 1               0               1   \n",
       "4                     1                 0               1               0   \n",
       "...                 ...               ...             ...             ...   \n",
       "55141                 1                 0               1               0   \n",
       "55142                 1                 0               1               0   \n",
       "55143                 0                 1               0               1   \n",
       "55144                 1                 0               1               0   \n",
       "55145                 1                 0               1               0   \n",
       "\n",
       "       no_PCPs_0.0  no_PCPs_1.0  ...  labCount_ave_0.0  labCount_ave_1.0  \\\n",
       "0                1            0  ...                 0                 1   \n",
       "1                1            0  ...                 0                 1   \n",
       "2                1            0  ...                 0                 1   \n",
       "3                1            0  ...                 0                 1   \n",
       "4                1            0  ...                 0                 1   \n",
       "...            ...          ...  ...               ...               ...   \n",
       "55141            1            0  ...                 0                 1   \n",
       "55142            1            0  ...                 0                 1   \n",
       "55143            1            0  ...                 0                 1   \n",
       "55144            1            0  ...                 1                 0   \n",
       "55145            1            0  ...                 0                 1   \n",
       "\n",
       "       labcount_months_0.0  labcount_months_1.0  labNull_0.0  labNull_1.0  \\\n",
       "0                        0                    1            1            0   \n",
       "1                        0                    1            1            0   \n",
       "2                        0                    1            1            0   \n",
       "3                        0                    1            1            0   \n",
       "4                        0                    1            1            0   \n",
       "...                    ...                  ...          ...          ...   \n",
       "55141                    0                    1            1            0   \n",
       "55142                    1                    0            1            0   \n",
       "55143                    0                    1            1            0   \n",
       "55144                    1                    0            0            1   \n",
       "55145                    1                    0            1            0   \n",
       "\n",
       "       drugNull_0.0  drugNull_1.0  sex_0  sex_1  \n",
       "0                 0             1      1      0  \n",
       "1                 1             0      1      0  \n",
       "2                 1             0      1      0  \n",
       "3                 0             1      0      1  \n",
       "4                 1             0      0      1  \n",
       "...             ...           ...    ...    ...  \n",
       "55141             1             0      0      1  \n",
       "55142             1             0      1      0  \n",
       "55143             1             0      0      1  \n",
       "55144             1             0      0      1  \n",
       "55145             0             1      0      1  \n",
       "\n",
       "[55146 rows x 254 columns]"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df['sex'] = df['sex'].astype('category')\n",
    "pd.get_dummies(df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_32774/1642803216.py:2: PerformanceWarning: DataFrame is highly fragmented.  This is usually the result of calling `frame.insert` many times, which has poor performance.  Consider joining all columns at once using pd.concat(axis=1) instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n",
      "  data_health['label'] = Y\n",
      "/tmp/ipykernel_32774/1642803216.py:3: PerformanceWarning: DataFrame is highly fragmented.  This is usually the result of calling `frame.insert` many times, which has poor performance.  Consider joining all columns at once using pd.concat(axis=1) instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n",
      "  data_health['sex'] = S\n"
     ]
    }
   ],
   "source": [
    "data_health = pd.get_dummies(df)\n",
    "data_health['label'] = Y\n",
    "data_health['sex'] = S"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.save('../data/health_train', data_health.iloc[:num_train, :])\n",
    "np.save('../data/health_test', data_health.iloc[num_train:, :])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "# with open('health_train.pkl', 'wb') as f:\n",
    "#     pickle.dump(data_health.iloc[:num_train, :], f)\n",
    "\n",
    "# with open('health_test.pkl', 'wb') as f:\n",
    "#     pickle.dump(data_health.iloc[num_train:, :], f)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "hydra",
   "language": "python",
   "name": "hydra"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
