{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "82beccaa-e829-4712-99e5-014dfb189c59",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "from scipy.spatial.distance import cdist\n",
    "import random\n",
    "from sklearn.cluster import KMeans\n",
    "import sys\n",
    "sys.path.append('../')\n",
    "from icfesl import *\n",
    "from utility_functions import *\n",
    "from sklearn.feature_selection import VarianceThreshold\n",
    "from xgboost import XGBRegressor\n",
    "from pytorch_tabnet.tab_model import TabNetRegressor\n",
    "from sklearn.mixture import GaussianMixture\n",
    "import time\n",
    "from sklearn.model_selection import train_test_split\n",
    "import matplotlib.pyplot as plt\n",
    "from feature_engine.datetime import DatetimeFeatures\n",
    "from catboost import CatBoostRegressor, Pool\n",
    "from sklearn.preprocessing import LabelEncoder"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "9706d06e-64c7-49e9-b15f-4f49265fcc85",
   "metadata": {},
   "outputs": [],
   "source": [
    "path = \"../../../writing/kaggle dataset/US_Air_quality/aqi_data_17_21.csv\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "0df55b74-b7c9-4855-91c3-4f6d09285c5b",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/var/folders/j7/w07zs41n4s5df3svj9ygmh9h0000gn/T/ipykernel_3950/2200478113.py:1: DtypeWarning: Columns (11) have mixed types. Specify dtype option on import or set low_memory=False.\n",
      "  raw_data = pd.read_csv(path)\n"
     ]
    }
   ],
   "source": [
    "raw_data = pd.read_csv(path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "ac4d8aec-62dc-4f9e-9e94-78d8df16478f",
   "metadata": {},
   "outputs": [],
   "source": [
    "raw_data.units_of_measure = raw_data.units_of_measure.astype(str)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "c7f13a08-04a4-4a54-be0f-1be94827f21b",
   "metadata": {},
   "outputs": [],
   "source": [
    "raw_data = raw_data.loc[raw_data['sample_duration']=='24 HOUR']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "b69f4e10-0d2b-4de4-9a23-e91aafcadefb",
   "metadata": {},
   "outputs": [],
   "source": [
    "dtf = DatetimeFeatures(features_to_extract=[\"month\", 'hour'])\n",
    "\n",
    "date_features = dtf.fit_transform(raw_data[['date_local']])\n",
    "\n",
    "raw_data = pd.concat([raw_data, date_features], axis=1).sample(n=100000, random_state = 200)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "0667d9b1-a73c-4285-a3e8-fc6db996386f",
   "metadata": {},
   "outputs": [],
   "source": [
    "cat_vars = ['site_number','method','first_max_hour', 'state','county','city','date_local_month','date_local_hour']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "0baca774-cc85-40e9-a600-1f9021ac5b56",
   "metadata": {},
   "outputs": [],
   "source": [
    "X = raw_data[cat_vars]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "9614c1d2-1460-43c1-ab28-218643753fe4",
   "metadata": {},
   "outputs": [],
   "source": [
    "y = raw_data['aqi']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "6b5e6aa7-4a60-4387-9f37-a422218857df",
   "metadata": {},
   "outputs": [],
   "source": [
    "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "0de93675-5e5b-4035-b355-e6d1e55e9630",
   "metadata": {},
   "outputs": [],
   "source": [
    "X_train = X_train.reset_index(drop=True)\n",
    "X_test = X_test.reset_index(drop=True)\n",
    "y_train = y_train.reset_index(drop=True)\n",
    "y_test = y_test.reset_index(drop=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "97f8335a-581d-4444-be09-9c4a384e8fef",
   "metadata": {},
   "outputs": [],
   "source": [
    "X2, encoder = icfesl.f_get_dummies(X_train, cat_vars)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "8db04298-4609-4666-bf42-70effe7dde00",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/opt/anaconda3/lib/python3.13/site-packages/sklearn/preprocessing/_encoders.py:246: UserWarning: Found unknown categories in columns [2, 5] during transform. These unknown categories will be encoded as all zeros\n",
      "  warnings.warn(\n"
     ]
    }
   ],
   "source": [
    "X2_test = icfesl.f_get_dummies(X_test, cat_vars, encoder=encoder)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "34a046e4-07d5-45ce-9f09-5ef030e0383c",
   "metadata": {},
   "outputs": [],
   "source": [
    "selector = VarianceThreshold()\n",
    "\n",
    "selector.fit(X2)\n",
    "\n",
    "selected_features_mask = selector.get_support()\n",
    "\n",
    "selected_column_names = X2.columns[selected_features_mask]\n",
    "\n",
    "X2 = X2[selected_column_names]\n",
    "\n",
    "X2_test = X2_test[selected_column_names]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "f14516c9-cb0a-4a1a-aeef-da52fb19ccf3",
   "metadata": {},
   "outputs": [],
   "source": [
    "for c in X2.columns.tolist():\n",
    "    X2[c] = X2[c].astype('int')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "c92afd8c-6758-4df9-9bd0-a323d34f9957",
   "metadata": {},
   "outputs": [],
   "source": [
    "for c in X2_test.columns.tolist():\n",
    "    X2_test[c] = X2_test[c].astype('int')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "c7d8a241-85c1-451d-86e9-4faa3e807d54",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(70000, 1191)"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "X2.shape"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "4f9efe23-76f4-49e5-9130-053c9680dd64",
   "metadata": {},
   "source": [
    "### ICFESL"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "95eed9eb-f300-40a6-b9d4-dd749b7e3769",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m2025-12-02 21:07:42.140\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m397\u001b[0m - \u001b[1mrunning algorithm with L2 regularization factor = 0.2 ------>\u001b[0m\n",
      "\u001b[32m2025-12-02 21:09:15.864\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m453\u001b[0m - \u001b[1mRunning OLS with ICFESL encoding\u001b[0m\n",
      "\u001b[32m2025-12-02 21:09:16.484\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m471\u001b[0m - \u001b[1mRunning xgbRegressor with ICFESL encoding\u001b[0m\n",
      "\u001b[32m2025-12-02 21:09:17.031\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m485\u001b[0m - \u001b[1mCompleted: running algorithm with L2 regularization factor = 0.2 ------>\u001b[0m\n",
      "\u001b[32m2025-12-02 21:09:17.032\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m397\u001b[0m - \u001b[1mrunning algorithm with L2 regularization factor = 0.5 ------>\u001b[0m\n",
      "\u001b[32m2025-12-02 21:11:24.747\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m453\u001b[0m - \u001b[1mRunning OLS with ICFESL encoding\u001b[0m\n",
      "\u001b[32m2025-12-02 21:11:25.455\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m471\u001b[0m - \u001b[1mRunning xgbRegressor with ICFESL encoding\u001b[0m\n",
      "\u001b[32m2025-12-02 21:11:26.030\u001b[0m | \u001b[1mINFO    \u001b[0m | \u001b[36micfesl\u001b[0m:\u001b[36mregularized_search_algorun\u001b[0m:\u001b[36m485\u001b[0m - \u001b[1mCompleted: running algorithm with L2 regularization factor = 0.5 ------>\u001b[0m\n"
     ]
    }
   ],
   "source": [
    "fit_info_panel, index_of_best, figs, cluster_groups, criterions, inertias, gap_statss = icfesl.regularized_search_algorun(\n",
    "        X2, y_train, X2_test, y_test, cat_vars, 'regression', alphas = [0.2, 0.5],\n",
    "        cbine_column=False, distance_threshold=0.005, figure=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "9139ee6e-1f9f-4834-961e-fa45bf6fe245",
   "metadata": {},
   "outputs": [],
   "source": [
    "decision_plot, summary_plot = figs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "249dd729-9c39-47e6-9a7d-9fa33799607f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Experiment</th>\n",
       "      <th>dof</th>\n",
       "      <th>reg_fit_time</th>\n",
       "      <th>reg_training_rmse</th>\n",
       "      <th>reg_testing_rmse</th>\n",
       "      <th>xgb_fit_time</th>\n",
       "      <th>xgb_training_rmse</th>\n",
       "      <th>xgb_testing_rmse</th>\n",
       "      <th>var_inf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>152.0</td>\n",
       "      <td>0.5261</td>\n",
       "      <td>17.483796</td>\n",
       "      <td>18.015862</td>\n",
       "      <td>0.4927</td>\n",
       "      <td>16.595690</td>\n",
       "      <td>17.441367</td>\n",
       "      <td>4.418721e-10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>178.0</td>\n",
       "      <td>0.6059</td>\n",
       "      <td>17.471263</td>\n",
       "      <td>18.011565</td>\n",
       "      <td>0.5150</td>\n",
       "      <td>16.534453</td>\n",
       "      <td>17.343387</td>\n",
       "      <td>2.075008e-10</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Experiment    dof  reg_fit_time  reg_training_rmse  reg_testing_rmse  \\\n",
       "0           0  152.0        0.5261          17.483796         18.015862   \n",
       "1           1  178.0        0.6059          17.471263         18.011565   \n",
       "\n",
       "   xgb_fit_time  xgb_training_rmse  xgb_testing_rmse       var_inf  \n",
       "0        0.4927          16.595690         17.441367  4.418721e-10  \n",
       "1        0.5150          16.534453         17.343387  2.075008e-10  "
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "fit_info_panel"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "c29881f4-a3d9-4ef4-84a7-ceb656bd7acf",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'site_number+0': ['site_number::27',\n",
       "  'site_number::59',\n",
       "  'site_number::97',\n",
       "  'site_number::128'],\n",
       " 'site_number+1': ['site_number::14',\n",
       "  'site_number::25',\n",
       "  'site_number::32',\n",
       "  'site_number::34',\n",
       "  'site_number::39',\n",
       "  'site_number::73',\n",
       "  'site_number::79',\n",
       "  'site_number::93',\n",
       "  'site_number::103',\n",
       "  'site_number::500',\n",
       "  'site_number::922',\n",
       "  'site_number::1002',\n",
       "  'site_number::1016',\n",
       "  'site_number::1034',\n",
       "  'site_number::1053',\n",
       "  'site_number::2022',\n",
       "  'site_number::4004',\n",
       "  'site_number::7550',\n",
       "  'site_number::7554'],\n",
       " 'site_number+2': ['site_number::15',\n",
       "  'site_number::23',\n",
       "  'site_number::133',\n",
       "  'site_number::1046',\n",
       "  'site_number::1302',\n",
       "  'site_number::4008'],\n",
       " 'site_number+3': ['site_number::6',\n",
       "  'site_number::24',\n",
       "  'site_number::26',\n",
       "  'site_number::28',\n",
       "  'site_number::31',\n",
       "  'site_number::50',\n",
       "  'site_number::56',\n",
       "  'site_number::91',\n",
       "  'site_number::1037'],\n",
       " 'site_number+4': ['site_number::30',\n",
       "  'site_number::1012',\n",
       "  'site_number::3001'],\n",
       " 'site_number+5': ['site_number::45',\n",
       "  'site_number::60',\n",
       "  'site_number::65',\n",
       "  'site_number::561',\n",
       "  'site_number::1013',\n",
       "  'site_number::1026',\n",
       "  'site_number::2123'],\n",
       " 'site_number+6': ['site_number::5',\n",
       "  'site_number::22',\n",
       "  'site_number::76',\n",
       "  'site_number::100',\n",
       "  'site_number::101',\n",
       "  'site_number::124',\n",
       "  'site_number::415',\n",
       "  'site_number::1039',\n",
       "  'site_number::2009',\n",
       "  'site_number::2059',\n",
       "  'site_number::5002'],\n",
       " 'site_number+7': ['site_number::12',\n",
       "  'site_number::41',\n",
       "  'site_number::80',\n",
       "  'site_number::1020',\n",
       "  'site_number::1235',\n",
       "  'site_number::4201'],\n",
       " 'site_number+8': ['site_number::11',\n",
       "  'site_number::87',\n",
       "  'site_number::110',\n",
       "  'site_number::114',\n",
       "  'site_number::125',\n",
       "  'site_number::540',\n",
       "  'site_number::1001',\n",
       "  'site_number::1010',\n",
       "  'site_number::1017',\n",
       "  'site_number::1041',\n",
       "  'site_number::2002',\n",
       "  'site_number::2013',\n",
       "  'site_number::3006',\n",
       "  'site_number::3103'],\n",
       " 'site_number+9': ['site_number::98', 'site_number::99'],\n",
       " 'site_number+10': ['site_number::13',\n",
       "  'site_number::44',\n",
       "  'site_number::67',\n",
       "  'site_number::868',\n",
       "  'site_number::1003',\n",
       "  'site_number::1008',\n",
       "  'site_number::1052',\n",
       "  'site_number::2004',\n",
       "  'site_number::3301',\n",
       "  'site_number::5001',\n",
       "  'site_number::7020',\n",
       "  'site_number::9997'],\n",
       " 'site_number+11': ['site_number::16',\n",
       "  'site_number::33',\n",
       "  'site_number::36',\n",
       "  'site_number::83',\n",
       "  'site_number::134',\n",
       "  'site_number::467',\n",
       "  'site_number::470',\n",
       "  'site_number::1005',\n",
       "  'site_number::1006',\n",
       "  'site_number::1024',\n",
       "  'site_number::1031',\n",
       "  'site_number::2129',\n",
       "  'site_number::5008'],\n",
       " 'site_number+12': ['site_number::17',\n",
       "  'site_number::1009',\n",
       "  'site_number::1068',\n",
       "  'site_number::3010',\n",
       "  'site_number::8005'],\n",
       " 'site_number+13': ['site_number::37',\n",
       "  'site_number::40',\n",
       "  'site_number::122',\n",
       "  'site_number::2003'],\n",
       " 'site_number+14': ['site_number::20',\n",
       "  'site_number::29',\n",
       "  'site_number::35',\n",
       "  'site_number::38',\n",
       "  'site_number::43',\n",
       "  'site_number::51',\n",
       "  'site_number::64',\n",
       "  'site_number::1069',\n",
       "  'site_number::3015'],\n",
       " 'site_number+15': ['site_number::3',\n",
       "  'site_number::8',\n",
       "  'site_number::10',\n",
       "  'site_number::19',\n",
       "  'site_number::78',\n",
       "  'site_number::84',\n",
       "  'site_number::1028',\n",
       "  'site_number::2001',\n",
       "  'site_number::2005',\n",
       "  'site_number::4002',\n",
       "  'site_number::8001'],\n",
       " 'site_number+16': ['site_number::9',\n",
       "  'site_number::55',\n",
       "  'site_number::95',\n",
       "  'site_number::1004',\n",
       "  'site_number::1011',\n",
       "  'site_number::1022',\n",
       "  'site_number::1103',\n",
       "  'site_number::1301',\n",
       "  'site_number::1602',\n",
       "  'site_number::2010',\n",
       "  'site_number::5005'],\n",
       " 'site_number+17': ['site_number::2',\n",
       "  'site_number::58',\n",
       "  'site_number::69',\n",
       "  'site_number::401',\n",
       "  'site_number::871',\n",
       "  'site_number::963',\n",
       "  'site_number::1123',\n",
       "  'site_number::2006',\n",
       "  'site_number::2011',\n",
       "  'site_number::2510',\n",
       "  'site_number::5010',\n",
       "  'site_number::6005',\n",
       "  'site_number::9004',\n",
       "  'site_number::9021'],\n",
       " 'site_number+18': ['site_number::18',\n",
       "  'site_number::42',\n",
       "  'site_number::48',\n",
       "  'site_number::52',\n",
       "  'site_number::57',\n",
       "  'site_number::75',\n",
       "  'site_number::1007',\n",
       "  'site_number::1015',\n",
       "  'site_number::1035',\n",
       "  'site_number::1201',\n",
       "  'site_number::3007',\n",
       "  'site_number::4001',\n",
       "  'site_number::6001'],\n",
       " 'site_number+19': ['site_number::4',\n",
       "  'site_number::7',\n",
       "  'site_number::21',\n",
       "  'site_number::49',\n",
       "  'site_number::81',\n",
       "  'site_number::85',\n",
       "  'site_number::505',\n",
       "  'site_number::1127',\n",
       "  'site_number::3002',\n",
       "  'site_number::5025',\n",
       "  'site_number::6006'],\n",
       " 'method+0': ['method::R & P Model 2000 PM-2.5 Air Sampler w/VSCC - Gravimetric',\n",
       "  'method::R & P Model 2025 PM-2.5 Sequential Air Sampler w/VSCC - Gravimetric'],\n",
       " 'method+1': ['method::Met One E-SEQ-FRM PM2.5 with VSCC - Gravimetric'],\n",
       " 'method+2': ['method::BGI Models PQ200-VSCC or PQ200A-VSCC - Gravimetric'],\n",
       " 'method+3': ['method::Met One E-FRM PM2.5 with VSCC - Gravimetric',\n",
       "  'method::R & P Model 2000 PM2.5 Sampler w/WINS - GRAVIMETRIC'],\n",
       " 'method+4': ['method::Thermo Electron Model RAAS2.5-300 Sequential w/VSCC - Gravimetric'],\n",
       " 'method+5': ['method::R & P Model 2025 PM2.5 Sequential w/WINS - GRAVIMETRIC'],\n",
       " 'method+6': ['method::Thermo Electron Model RAAS2.5-100 w/VSCC - Gravimetric'],\n",
       " 'method+7': ['method::Thermo Scientific Dichot. Partisol-Plus Model 2025-D Seq - Gravimetric'],\n",
       " 'state+0': ['state::Louisiana',\n",
       "  'state::Michigan',\n",
       "  'state::New Jersey',\n",
       "  'state::Ohio',\n",
       "  'state::West Virginia'],\n",
       " 'state+1': ['state::Connecticut',\n",
       "  'state::Massachusetts',\n",
       "  'state::New Hampshire',\n",
       "  'state::Rhode Island'],\n",
       " 'state+2': ['state::Georgia'],\n",
       " 'state+3': ['state::District Of Columbia',\n",
       "  'state::Minnesota',\n",
       "  'state::Montana',\n",
       "  'state::Utah',\n",
       "  'state::Vermont'],\n",
       " 'state+4': ['state::California', 'state::Illinois', 'state::Missouri'],\n",
       " 'state+5': ['state::Wyoming'],\n",
       " 'state+6': ['state::Hawaii', 'state::New York'],\n",
       " 'state+7': ['state::Washington'],\n",
       " 'state+8': ['state::Oregon', 'state::Texas'],\n",
       " 'state+9': ['state::Pennsylvania'],\n",
       " 'state+10': ['state::Nebraska', 'state::South Dakota', 'state::Wisconsin'],\n",
       " 'state+11': ['state::Iowa', 'state::Kentucky', 'state::Tennessee'],\n",
       " 'state+12': ['state::Arkansas', 'state::Indiana', 'state::Maryland'],\n",
       " 'state+13': ['state::Maine'],\n",
       " 'state+14': ['state::Colorado',\n",
       "  'state::Nevada',\n",
       "  'state::New Mexico',\n",
       "  'state::Virginia'],\n",
       " 'state+15': ['state::Idaho',\n",
       "  'state::Kansas',\n",
       "  'state::Mississippi',\n",
       "  'state::Puerto Rico',\n",
       "  'state::South Carolina'],\n",
       " 'state+16': ['state::Delaware',\n",
       "  'state::North Carolina',\n",
       "  'state::North Dakota'],\n",
       " 'state+17': ['state::Alaska',\n",
       "  'state::Arizona',\n",
       "  'state::Florida',\n",
       "  'state::Oklahoma'],\n",
       " 'county+0': ['county::Butler',\n",
       "  'county::Dane',\n",
       "  'county::Davidson',\n",
       "  'county::Daviess',\n",
       "  'county::Dona Ana',\n",
       "  'county::Duval',\n",
       "  'county::Fairfax',\n",
       "  'county::Fulton',\n",
       "  'county::Hamilton',\n",
       "  'county::Jefferson',\n",
       "  'county::Johnston',\n",
       "  'county::Kenosha',\n",
       "  'county::Lemhi',\n",
       "  'county::Los Angeles',\n",
       "  'county::Merced',\n",
       "  'county::Queens',\n",
       "  'county::Richmond City',\n",
       "  'county::West Baton Rouge'],\n",
       " 'county+1': ['county::Alachua',\n",
       "  'county::Allegan',\n",
       "  'county::Androscoggin',\n",
       "  'county::Bay',\n",
       "  'county::Bell',\n",
       "  'county::Belmont',\n",
       "  'county::Bexar',\n",
       "  'county::Blount',\n",
       "  'county::Bristol City',\n",
       "  'county::Bronx',\n",
       "  'county::Burleigh',\n",
       "  'county::Calcasieu',\n",
       "  'county::Carter',\n",
       "  'county::Chatham',\n",
       "  'county::Chittenden',\n",
       "  'county::Clarke',\n",
       "  'county::Colusa',\n",
       "  'county::Cumberland',\n",
       "  'county::DeSoto',\n",
       "  'county::District of Columbia',\n",
       "  'county::Douglas',\n",
       "  'county::Durham',\n",
       "  'county::Floyd',\n",
       "  'county::Franklin',\n",
       "  'county::Galveston',\n",
       "  'county::Genesee',\n",
       "  'county::Glynn',\n",
       "  'county::Hampton City',\n",
       "  'county::Hancock',\n",
       "  'county::Harrison',\n",
       "  'county::Henrico',\n",
       "  'county::Howard',\n",
       "  'county::Johnson',\n",
       "  'county::Lawrence',\n",
       "  'county::Lorain',\n",
       "  'county::McHenry',\n",
       "  'county::Mitchell',\n",
       "  'county::Muscogee',\n",
       "  'county::New Haven',\n",
       "  'county::New London',\n",
       "  'county::Palm Beach',\n",
       "  'county::Palo Alto',\n",
       "  'county::Park',\n",
       "  'county::Penobscot',\n",
       "  'county::Perry',\n",
       "  'county::Philadelphia',\n",
       "  'county::Pike',\n",
       "  'county::Pima',\n",
       "  'county::Pinellas',\n",
       "  'county::Pittsburg',\n",
       "  'county::Portage',\n",
       "  'county::Porter',\n",
       "  'county::Preble',\n",
       "  'county::Providence',\n",
       "  'county::Salem City',\n",
       "  'county::Salt Lake',\n",
       "  'county::Seminole',\n",
       "  'county::Spartanburg',\n",
       "  'county::Spencer',\n",
       "  'county::St. Joseph',\n",
       "  'county::Summit',\n",
       "  'county::Sweetwater',\n",
       "  'county::Tangipahoa',\n",
       "  'county::Terrebonne',\n",
       "  'county::Volusia',\n",
       "  'county::Warren',\n",
       "  'county::Washington',\n",
       "  'county::Washoe',\n",
       "  'county::Whitley',\n",
       "  'county::Worcester'],\n",
       " 'county+2': ['county::Albany',\n",
       "  'county::Albemarle',\n",
       "  'county::Allen',\n",
       "  'county::Anoka',\n",
       "  'county::Ashley',\n",
       "  'county::Baldwin',\n",
       "  'county::Baltimore',\n",
       "  'county::Baltimore (City)',\n",
       "  'county::Bayamon',\n",
       "  'county::Beaver',\n",
       "  'county::Benton',\n",
       "  'county::Berkeley',\n",
       "  'county::Berkshire',\n",
       "  'county::Berrien',\n",
       "  'county::Bibb',\n",
       "  'county::Boulder',\n",
       "  'county::Bowie',\n",
       "  'county::Brown',\n",
       "  'county::Butte',\n",
       "  'county::Cache',\n",
       "  'county::Camden',\n",
       "  'county::Canyon',\n",
       "  'county::Chautauqua',\n",
       "  'county::Clay',\n",
       "  'county::Clayton',\n",
       "  'county::Clinton',\n",
       "  'county::Colbert',\n",
       "  'county::Cook',\n",
       "  'county::Crittenden',\n",
       "  'county::Crook',\n",
       "  'county::Cuyahoga',\n",
       "  'county::Dakota',\n",
       "  'county::Dallas',\n",
       "  'county::Dauphin',\n",
       "  'county::Davis',\n",
       "  'county::DeKalb',\n",
       "  'county::Dodge',\n",
       "  'county::Dubois',\n",
       "  'county::East Baton Rouge',\n",
       "  'county::El Paso',\n",
       "  'county::Escambia',\n",
       "  'county::Etowah',\n",
       "  'county::Forrest',\n",
       "  'county::Forsyth',\n",
       "  'county::Garland',\n",
       "  'county::Guaynabo',\n",
       "  'county::Hennepin',\n",
       "  'county::Houston',\n",
       "  'county::Hudson',\n",
       "  'county::Ingham',\n",
       "  'county::Jackson',\n",
       "  'county::Kalamazoo',\n",
       "  'county::Kane',\n",
       "  'county::Le Flore',\n",
       "  'county::Lee',\n",
       "  'county::Leon',\n",
       "  'county::Lexington',\n",
       "  'county::Macomb',\n",
       "  'county::Madison',\n",
       "  'county::Mahoning',\n",
       "  'county::Maricopa',\n",
       "  'county::Marion',\n",
       "  'county::McCracken',\n",
       "  'county::Mecklenburg',\n",
       "  'county::Minnehaha',\n",
       "  'county::Mono',\n",
       "  'county::New Castle',\n",
       "  'county::Oakland',\n",
       "  'county::Ohio',\n",
       "  'county::Olmsted',\n",
       "  'county::Orange',\n",
       "  'county::Ouachita',\n",
       "  'county::Oxford',\n",
       "  'county::Polk',\n",
       "  \"county::Prince George's\",\n",
       "  'county::Rapides',\n",
       "  'county::Rockingham',\n",
       "  'county::Sacramento',\n",
       "  'county::Sedgwick',\n",
       "  'county::Sequoyah',\n",
       "  'county::Shelby',\n",
       "  'county::Sheridan',\n",
       "  'county::Shoshone',\n",
       "  'county::St. Clair',\n",
       "  'county::Stanislaus',\n",
       "  'county::Steuben',\n",
       "  'county::Suffolk',\n",
       "  'county::Sussex',\n",
       "  'county::Sutter',\n",
       "  'county::Tarrant',\n",
       "  'county::Tippecanoe',\n",
       "  'county::Trumbull',\n",
       "  'county::Tuscaloosa',\n",
       "  'county::Vigo',\n",
       "  'county::Virginia Beach City',\n",
       "  'county::Waukesha',\n",
       "  'county::Weld',\n",
       "  'county::Yakima',\n",
       "  'county::Yolo'],\n",
       " 'county+3': ['county::Adjuntas',\n",
       "  'county::Apache',\n",
       "  'county::Arkansas',\n",
       "  'county::Atlantic',\n",
       "  'county::Bartholomew',\n",
       "  'county::Belknap',\n",
       "  'county::Berks',\n",
       "  'county::Bernalillo',\n",
       "  'county::Boyd',\n",
       "  'county::Bristol',\n",
       "  'county::Carson City',\n",
       "  'county::Champaign',\n",
       "  'county::Chester',\n",
       "  'county::Coffee',\n",
       "  'county::Essex',\n",
       "  'county::Gloucester',\n",
       "  'county::Greenville',\n",
       "  'county::Hampden',\n",
       "  'county::Hawaii',\n",
       "  'county::Henry',\n",
       "  'county::Hillsborough',\n",
       "  'county::Honolulu',\n",
       "  'county::Humboldt',\n",
       "  'county::Inyo',\n",
       "  'county::Juneau ',\n",
       "  'county::Kanawha',\n",
       "  'county::Kent',\n",
       "  'county::LaPorte',\n",
       "  'county::Laramie',\n",
       "  'county::Lewis and Clark',\n",
       "  'county::Litchfield',\n",
       "  'county::Lynchburg City',\n",
       "  'county::Manistee',\n",
       "  'county::Matanuska-Susitna ',\n",
       "  'county::Middlesex',\n",
       "  'county::Missaukee',\n",
       "  'county::Monterey',\n",
       "  'county::Montgomery',\n",
       "  'county::Morgan',\n",
       "  'county::Multnomah',\n",
       "  'county::Nevada',\n",
       "  'county::Ocean',\n",
       "  'county::Pennington',\n",
       "  'county::Ponce',\n",
       "  'county::Pueblo',\n",
       "  'county::Scioto',\n",
       "  'county::Shasta',\n",
       "  'county::Teton'],\n",
       " 'county+4': ['county::Benewah'],\n",
       " 'county+5': ['county::Brooke',\n",
       "  'county::Christian',\n",
       "  'county::Cobb',\n",
       "  'county::Elkhart',\n",
       "  'county::Erie',\n",
       "  'county::Fajardo',\n",
       "  'county::Fayette',\n",
       "  'county::Frederick',\n",
       "  'county::Fremont',\n",
       "  'county::Greene',\n",
       "  'county::Gwinnett',\n",
       "  'county::Harris',\n",
       "  'county::Hartford',\n",
       "  'county::Hidalgo',\n",
       "  'county::Imperial',\n",
       "  'county::Josephine',\n",
       "  'county::Klamath',\n",
       "  'county::Lebanon',\n",
       "  'county::Linn',\n",
       "  'county::Madera',\n",
       "  'county::Marshall',\n",
       "  'county::Milwaukee',\n",
       "  'county::Mobile',\n",
       "  'county::Monroe',\n",
       "  'county::Morris',\n",
       "  'county::Neosho',\n",
       "  'county::Pinal',\n",
       "  'county::Placer',\n",
       "  'county::Pulaski',\n",
       "  'county::Richmond',\n",
       "  'county::Russell',\n",
       "  'county::Saint Clair',\n",
       "  'county::San Bernardino',\n",
       "  'county::Santa Cruz',\n",
       "  'county::Sauk',\n",
       "  'county::Silver Bow',\n",
       "  'county::St. Bernard',\n",
       "  'county::Sullivan',\n",
       "  'county::Talladega',\n",
       "  'county::Union',\n",
       "  'county::Wake',\n",
       "  'county::Walker',\n",
       "  'county::Washtenaw',\n",
       "  'county::Wayne',\n",
       "  'county::Wyandotte'],\n",
       " 'county+6': ['county::Allegheny',\n",
       "  'county::Arapahoe',\n",
       "  'county::Arlington',\n",
       "  'county::Aroostook',\n",
       "  'county::Athens',\n",
       "  'county::Bergen',\n",
       "  'county::Black Hawk',\n",
       "  'county::Box Elder',\n",
       "  'county::Brevard',\n",
       "  'county::Broward',\n",
       "  'county::Buncombe',\n",
       "  'county::Cabell',\n",
       "  'county::Caguas',\n",
       "  'county::Campbell',\n",
       "  'county::Catawba',\n",
       "  'county::Charles',\n",
       "  'county::Charleston',\n",
       "  'county::Cheshire',\n",
       "  'county::Chesterfield',\n",
       "  'county::Clark',\n",
       "  'county::Delaware',\n",
       "  'county::Denver',\n",
       "  'county::Dougherty',\n",
       "  'county::Edgefield',\n",
       "  'county::Ellis',\n",
       "  'county::Fairfield',\n",
       "  'county::Florence',\n",
       "  'county::Grenada',\n",
       "  'county::Hall',\n",
       "  'county::Hardin',\n",
       "  'county::Harney',\n",
       "  'county::Hinds',\n",
       "  'county::Iberville',\n",
       "  'county::Kennebec',\n",
       "  'county::Kern',\n",
       "  'county::King',\n",
       "  'county::Knox',\n",
       "  'county::Lafayette',\n",
       "  'county::Lake',\n",
       "  'county::Lane',\n",
       "  'county::Lenawee',\n",
       "  'county::Loudoun',\n",
       "  'county::Lowndes',\n",
       "  'county::Lucas',\n",
       "  'county::Medina',\n",
       "  'county::Mercer',\n",
       "  'county::Miami-Dade',\n",
       "  'county::Monongalia',\n",
       "  'county::Muscatine',\n",
       "  'county::Natrona',\n",
       "  'county::Norfolk City',\n",
       "  'county::Northampton',\n",
       "  'county::Nueces',\n",
       "  'county::Oklahoma',\n",
       "  'county::Onondaga',\n",
       "  'county::Orleans',\n",
       "  'county::Ottawa',\n",
       "  'county::Passaic',\n",
       "  'county::Pierce',\n",
       "  'county::Pitt',\n",
       "  'county::Plymouth',\n",
       "  'county::Pottawattamie',\n",
       "  'county::Ramsey',\n",
       "  'county::Richland',\n",
       "  'county::Riverside',\n",
       "  'county::Roanoke',\n",
       "  'county::Rutland',\n",
       "  'county::Saint Louis',\n",
       "  'county::San Diego',\n",
       "  'county::Santa Clara',\n",
       "  'county::Sarasota',\n",
       "  'county::Scott',\n",
       "  'county::Scotts Bluff',\n",
       "  'county::St. Louis City',\n",
       "  'county::Stark',\n",
       "  'county::Sumner',\n",
       "  'county::Tooele',\n",
       "  'county::Travis',\n",
       "  'county::Tulsa',\n",
       "  'county::Utah',\n",
       "  'county::Van Buren',\n",
       "  'county::Vanderburgh',\n",
       "  'county::Weber',\n",
       "  'county::Will',\n",
       "  'county::Winnebago',\n",
       "  'county::Wood',\n",
       "  'county::Woodbury'],\n",
       " 'county+7': ['county::Adams',\n",
       "  'county::Caddo',\n",
       "  'county::Fairbanks North Star ',\n",
       "  'county::Fresno',\n",
       "  'county::Henderson',\n",
       "  'county::Kings',\n",
       "  'county::La Crosse',\n",
       "  'county::Lancaster',\n",
       "  'county::New York',\n",
       "  'county::Plumas',\n",
       "  'county::Tulare'],\n",
       " 'city+0': ['city::Alexandria',\n",
       "  'city::Bountiful',\n",
       "  'city::Burns',\n",
       "  'city::Chula Vista',\n",
       "  'city::Evansville',\n",
       "  'city::Hendersonville',\n",
       "  'city::Hickory',\n",
       "  'city::Highland Heights',\n",
       "  'city::Jackson',\n",
       "  'city::Joliet',\n",
       "  'city::Knoxville',\n",
       "  'city::Lafayette',\n",
       "  'city::Lakeview',\n",
       "  'city::Lansing',\n",
       "  'city::Lima',\n",
       "  'city::Memphis',\n",
       "  'city::Mission',\n",
       "  'city::Newburgh',\n",
       "  'city::Oak Park',\n",
       "  'city::Port Huron',\n",
       "  'city::Portsmouth',\n",
       "  'city::Providence',\n",
       "  'city::Provo',\n",
       "  'city::Rochester',\n",
       "  'city::Roland',\n",
       "  'city::Rumford (census name for Rumford Compact)',\n",
       "  'city::Salt Lake City',\n",
       "  'city::San Jose',\n",
       "  'city::Seaford',\n",
       "  'city::Smithfield',\n",
       "  'city::Smiths Grove',\n",
       "  'city::St. Gabriel',\n",
       "  'city::St. Louis Park',\n",
       "  'city::St. Paul',\n",
       "  'city::Toledo',\n",
       "  'city::Valdosta',\n",
       "  'city::Vienna',\n",
       "  'city::Wichita'],\n",
       " 'city+1': ['city::Commerce City',\n",
       "  'city::Des Moines',\n",
       "  'city::La Crosse',\n",
       "  'city::Mira Loma',\n",
       "  'city::Shreveport'],\n",
       " 'city+2': ['city::Amherst',\n",
       "  'city::Champaign',\n",
       "  'city::East Ridge',\n",
       "  'city::Emmetsburg',\n",
       "  'city::Fort Myers',\n",
       "  'city::Galloway (Township of)',\n",
       "  'city::Laconia',\n",
       "  'city::Leeds',\n",
       "  'city::Lynchburg',\n",
       "  'city::Magna',\n",
       "  'city::McCandless Township',\n",
       "  'city::Michigan City',\n",
       "  'city::Mission Viejo',\n",
       "  'city::New Albany',\n",
       "  'city::Newport',\n",
       "  'city::Pasadena',\n",
       "  'city::Presque Isle',\n",
       "  'city::Salem',\n",
       "  'city::Stuttgart',\n",
       "  'city::Vinton',\n",
       "  'city::Warrensville Heights'],\n",
       " 'city+3': ['city::Bakersfield'],\n",
       " 'city+4': ['city::Austin',\n",
       "  'city::Avalon',\n",
       "  'city::Birmingham',\n",
       "  'city::Chicopee',\n",
       "  'city::Cincinnati',\n",
       "  'city::Cleves',\n",
       "  'city::East Farmingdale',\n",
       "  'city::East Saint Louis',\n",
       "  'city::Greenfield',\n",
       "  'city::Haverhill',\n",
       "  'city::Kennesaw',\n",
       "  'city::Long Beach',\n",
       "  'city::Madawaska (census name for Madawaska Center)',\n",
       "  'city::Oakridge',\n",
       "  'city::Sunrise Manor',\n",
       "  'city::Union City'],\n",
       " 'city+5': ['city::Lakeport', 'city::Lancaster', 'city::Steubenville'],\n",
       " 'city+6': ['city::Brockton',\n",
       "  'city::Casper',\n",
       "  'city::Chattanooga',\n",
       "  'city::Cleveland',\n",
       "  'city::Coconut Creek',\n",
       "  'city::Council Bluffs',\n",
       "  'city::Davenport',\n",
       "  'city::East Greenwich (Township of)',\n",
       "  'city::El Dorado',\n",
       "  'city::Erda',\n",
       "  'city::Fairfield',\n",
       "  'city::Freemansburg',\n",
       "  'city::Gray (Beattieville)',\n",
       "  'city::Greenville',\n",
       "  'city::Grenada',\n",
       "  'city::Homestead',\n",
       "  'city::Huntington',\n",
       "  'city::Jenison',\n",
       "  'city::Keeler',\n",
       "  'city::Lexington',\n",
       "  'city::Lindon',\n",
       "  'city::Muscatine',\n",
       "  'city::North Charleston',\n",
       "  'city::Oklahoma City',\n",
       "  'city::Reseda',\n",
       "  'city::Seattle',\n",
       "  'city::Shadyside',\n",
       "  'city::Tacoma',\n",
       "  'city::Weirton'],\n",
       " 'city+7': ['city::Albuquerque',\n",
       "  'city::Bloomington',\n",
       "  'city::Cornwall',\n",
       "  'city::Cottage Grove',\n",
       "  'city::East Providence',\n",
       "  'city::El Centro',\n",
       "  'city::Nashville',\n",
       "  'city::Nazlini (Trading Post)',\n",
       "  'city::Northbrook',\n",
       "  'city::Painesville',\n",
       "  'city::Pennsauken (Township of)',\n",
       "  'city::Ponce',\n",
       "  'city::Yellow Springs'],\n",
       " 'city+8': ['city::Portola'],\n",
       " 'city+9': ['city::Gary',\n",
       "  'city::Groveton',\n",
       "  'city::Gulfport',\n",
       "  'city::Houston',\n",
       "  'city::Liberty',\n",
       "  'city::Little Rock',\n",
       "  'city::Merced',\n",
       "  'city::Miami',\n",
       "  'city::Ontario'],\n",
       " 'city+10': ['city::Atlantic City',\n",
       "  'city::Boston',\n",
       "  'city::Brunswick',\n",
       "  'city::Carlisle',\n",
       "  'city::Cary',\n",
       "  'city::Chester',\n",
       "  'city::Cheyenne',\n",
       "  'city::Cody',\n",
       "  'city::Daytona Beach',\n",
       "  'city::Delray Beach',\n",
       "  'city::Dentsville (Dents)',\n",
       "  'city::Fishers (corporate name for Fishers Station)',\n",
       "  'city::Hazard',\n",
       "  'city::Hernando',\n",
       "  'city::Holland',\n",
       "  'city::Livonia',\n",
       "  'city::Louisville',\n",
       "  'city::Mena',\n",
       "  'city::New Paris',\n",
       "  'city::Not in a city',\n",
       "  'city::San Antonio',\n",
       "  'city::Spruce Pine',\n",
       "  'city::Worcester',\n",
       "  'city::Wyandotte'],\n",
       " 'city+11': ['city::Beaver Falls',\n",
       "  'city::Chico',\n",
       "  'city::El Cajon',\n",
       "  'city::Hammond',\n",
       "  'city::Hot Springs (Hot Springs National Park)',\n",
       "  'city::Huntsville',\n",
       "  'city::Los Angeles',\n",
       "  'city::Martinsburg',\n",
       "  'city::Pico Rivera',\n",
       "  'city::Sioux Falls',\n",
       "  'city::Springdale',\n",
       "  'city::Terre Haute',\n",
       "  'city::Virginia Beach',\n",
       "  'city::Wheeling',\n",
       "  'city::Winston-Salem',\n",
       "  'city::Woodland',\n",
       "  'city::Yuba City'],\n",
       " 'city+12': ['city::Eugene', 'city::Lincoln', 'city::Londonderry'],\n",
       " 'city+13': ['city::Apache Junction',\n",
       "  'city::Banning',\n",
       "  'city::Big Bear City',\n",
       "  'city::Palm Springs',\n",
       "  'city::Underhill (Town of)'],\n",
       " 'city+14': ['city::Rubidoux', 'city::Stanfield'],\n",
       " 'city+15': ['city::Helena Valley West Central',\n",
       "  'city::Medford',\n",
       "  'city::Montgomery',\n",
       "  'city::Nashville-Davidson (Remainder)',\n",
       "  'city::Newark',\n",
       "  'city::Visalia'],\n",
       " 'city+16': ['city::Adjuntas',\n",
       "  'city::Anthony',\n",
       "  'city::Duluth',\n",
       "  'city::Fairbanks',\n",
       "  'city::Indio',\n",
       "  'city::Kenner',\n",
       "  'city::Loretto',\n",
       "  'city::McDonald',\n",
       "  'city::Roxborough Park'],\n",
       " 'city+17': ['city::Arlington',\n",
       "  'city::Asheville',\n",
       "  'city::Bridgeport',\n",
       "  'city::Brigham City',\n",
       "  'city::Brook Park',\n",
       "  'city::Caguas',\n",
       "  'city::Canton',\n",
       "  'city::Chicago',\n",
       "  'city::Corpus Christi',\n",
       "  'city::Denver',\n",
       "  'city::East Syracuse',\n",
       "  'city::Elgin',\n",
       "  'city::Elizabethtown',\n",
       "  'city::Florence',\n",
       "  'city::Fort Lee',\n",
       "  'city::Franklin',\n",
       "  'city::Harrison Township',\n",
       "  'city::Keene',\n",
       "  'city::Lakeland',\n",
       "  'city::Littleton',\n",
       "  'city::Longmont',\n",
       "  'city::Melbourne',\n",
       "  'city::Midlothian',\n",
       "  'city::Morgantown',\n",
       "  'city::New Orleans',\n",
       "  'city::Norfolk',\n",
       "  'city::North Little Rock',\n",
       "  'city::Paterson',\n",
       "  'city::Portland',\n",
       "  'city::Richmond',\n",
       "  'city::Ridge Wood Heights',\n",
       "  'city::Rockford',\n",
       "  'city::Rutland',\n",
       "  'city::Sandersville',\n",
       "  'city::Scottsbluff',\n",
       "  'city::Scottsdale',\n",
       "  'city::Shakopee',\n",
       "  'city::Sioux City',\n",
       "  'city::St. Louis',\n",
       "  'city::Summit',\n",
       "  'city::Tecumseh',\n",
       "  'city::Trenton',\n",
       "  'city::Tualatin',\n",
       "  'city::Tulsa',\n",
       "  'city::Waterloo'],\n",
       " 'city+18': ['city::Buffalo',\n",
       "  'city::Camden',\n",
       "  'city::Dearborn',\n",
       "  'city::Dothan',\n",
       "  'city::East Chicago',\n",
       "  'city::Iowa City',\n",
       "  'city::Jacksonville',\n",
       "  'city::Ladue',\n",
       "  'city::Las Vegas',\n",
       "  'city::Madison',\n",
       "  'city::Newburgh Heights',\n",
       "  'city::San Bernardino',\n",
       "  'city::Waterbury'],\n",
       " 'city+19': ['city::Ashland',\n",
       "  'city::Carson City',\n",
       "  'city::Clearwater',\n",
       "  'city::East Brunswick (Township of)',\n",
       "  'city::Fall River',\n",
       "  'city::Harrisville',\n",
       "  'city::Juneau',\n",
       "  'city::Manistee',\n",
       "  'city::Pascagoula',\n",
       "  'city::Pueblo',\n",
       "  'city::Quincy',\n",
       "  'city::Rapid City',\n",
       "  'city::Redding',\n",
       "  'city::Toms River',\n",
       "  'city::Warner Robins'],\n",
       " 'city+20': ['city::Allen Park',\n",
       "  'city::Apple Valley',\n",
       "  'city::Augusta',\n",
       "  'city::Azusa',\n",
       "  'city::Baton Rouge',\n",
       "  'city::Bayamon',\n",
       "  'city::Beltsville',\n",
       "  'city::Blue Ash',\n",
       "  'city::Cicero',\n",
       "  'city::Coloma',\n",
       "  'city::Dallas',\n",
       "  'city::Danbury',\n",
       "  'city::Detroit',\n",
       "  'city::El Paso',\n",
       "  'city::Forest Park',\n",
       "  'city::Fort Wayne',\n",
       "  'city::Fort Worth',\n",
       "  'city::Hartford',\n",
       "  'city::Hattiesburg',\n",
       "  'city::Macon',\n",
       "  'city::Mammoth Lakes',\n",
       "  'city::Minneapolis',\n",
       "  'city::Pittsburgh',\n",
       "  'city::Pittsfield',\n",
       "  'city::Sheridan',\n",
       "  'city::South Charleston',\n",
       "  'city::Spanish Fork',\n",
       "  'city::Tuscaloosa',\n",
       "  'city::Wood River',\n",
       "  'city::Yakima'],\n",
       " 'city+21': ['city::Corcoran'],\n",
       " 'city+22': ['city::Butte-Silver Bow (Remainder)',\n",
       "  'city::Chickasaw',\n",
       "  'city::Dover',\n",
       "  'city::Edinburg',\n",
       "  'city::Elkhart',\n",
       "  'city::Grand Rapids',\n",
       "  'city::Jeffersonville',\n",
       "  'city::Lexington-Fayette (corporate name for Lexington)',\n",
       "  'city::Middletown',\n",
       "  'city::Moundsville',\n",
       "  'city::Raleigh',\n",
       "  'city::Roseville',\n",
       "  'city::Saint Petersburg',\n",
       "  'city::Ypsilanti'],\n",
       " 'city+23': ['city::Blair',\n",
       "  'city::Carmel',\n",
       "  'city::Cedar Rapids',\n",
       "  'city::Columbus',\n",
       "  'city::Dayton',\n",
       "  'city::Fontana',\n",
       "  'city::Grants Pass',\n",
       "  'city::Green Bay',\n",
       "  'city::Indianapolis (Remainder)',\n",
       "  'city::Ironton',\n",
       "  'city::Keokuk',\n",
       "  'city::Lander',\n",
       "  'city::Milwaukee',\n",
       "  'city::Pawtucket',\n",
       "  'city::Pompano Beach Highlands',\n",
       "  'city::Schiller Park',\n",
       "  'city::Springfield'],\n",
       " 'city+24': ['city::Albany',\n",
       "  'city::Altamont',\n",
       "  'city::Arden-Arcade',\n",
       "  'city::Boulder',\n",
       "  'city::Chalmette',\n",
       "  'city::Charleroi',\n",
       "  'city::Childersburg',\n",
       "  'city::Clarksburg',\n",
       "  'city::Compton',\n",
       "  'city::East Hartford',\n",
       "  'city::Elizabeth',\n",
       "  'city::Follansbee',\n",
       "  'city::Gadsden',\n",
       "  'city::Kansas City',\n",
       "  'city::Madera',\n",
       "  'city::Nogales',\n",
       "  'city::North Braddock',\n",
       "  'city::Pinehurst (Pine Creek)',\n",
       "  'city::Platteville',\n",
       "  'city::Warren',\n",
       "  'city::Wilmington'],\n",
       " 'city+25': ['city::Anderson',\n",
       "  'city::Hillsboro',\n",
       "  'city::New Haven',\n",
       "  'city::Peterborough (Peterboro)',\n",
       "  'city::Preston'],\n",
       " 'city+26': ['city::Akron',\n",
       "  'city::Alsip',\n",
       "  'city::Alton',\n",
       "  'city::Athens (corp name Athens-Clarke County)',\n",
       "  'city::Bangor',\n",
       "  'city::Bay City',\n",
       "  'city::Bismarck',\n",
       "  'city::Bondville',\n",
       "  'city::Bristol',\n",
       "  'city::Clairton',\n",
       "  'city::Colusa',\n",
       "  'city::Dale',\n",
       "  'city::Decatur',\n",
       "  'city::Deer Park',\n",
       "  'city::Durham',\n",
       "  'city::Gainesville',\n",
       "  'city::Garden City',\n",
       "  'city::Grass Valley',\n",
       "  'city::Hampton',\n",
       "  'city::Jersey City',\n",
       "  'city::Kokomo',\n",
       "  'city::Laramie',\n",
       "  'city::McAlester',\n",
       "  'city::Philadelphia',\n",
       "  'city::Pikeville',\n",
       "  'city::Rock Springs',\n",
       "  'city::Sacramento',\n",
       "  'city::Sanford',\n",
       "  'city::Sheffield',\n",
       "  'city::Somerset',\n",
       "  'city::South Bend',\n",
       "  'city::Tucson'],\n",
       " 'city+27': ['city::Aurora',\n",
       "  'city::Baltimore',\n",
       "  'city::Bella Vista',\n",
       "  'city::Blaine',\n",
       "  'city::Casa Grande',\n",
       "  'city::Charlotte',\n",
       "  'city::Cheektowaga',\n",
       "  'city::Clinton',\n",
       "  'city::Crossett',\n",
       "  'city::Dunkirk',\n",
       "  'city::Fairhope',\n",
       "  'city::Ferry Pass',\n",
       "  'city::Guaynabo',\n",
       "  'city::Horicon',\n",
       "  'city::Jasper',\n",
       "  'city::Kalamazoo',\n",
       "  'city::Marion',\n",
       "  'city::Mingo Junction',\n",
       "  'city::Modesto',\n",
       "  'city::Monroe',\n",
       "  'city::Muscle Shoals',\n",
       "  'city::Nampa',\n",
       "  'city::Overland Park',\n",
       "  'city::Paducah',\n",
       "  'city::Phoenix',\n",
       "  'city::Prineville',\n",
       "  'city::Rahway',\n",
       "  'city::Seven Oaks',\n",
       "  'city::South Valley',\n",
       "  'city::Tallahassee',\n",
       "  'city::Texarkana',\n",
       "  'city::Waukesha',\n",
       "  'city::Youngstown'],\n",
       " 'city+28': ['city::Brawley',\n",
       "  'city::Davie',\n",
       "  'city::Fairmont',\n",
       "  'city::Fayetteville',\n",
       "  'city::Flint',\n",
       "  'city::Galveston',\n",
       "  'city::Grand Island',\n",
       "  'city::Groton',\n",
       "  'city::Knowlton (Township of)',\n",
       "  'city::Lewiston',\n",
       "  'city::Maryville',\n",
       "  'city::Middlesborough (corporate name for Middlesboro)',\n",
       "  'city::Muncie',\n",
       "  'city::Ogden Dunes (Wickliffe)',\n",
       "  'city::Ravenna',\n",
       "  'city::Reno',\n",
       "  'city::San Diego',\n",
       "  'city::Simpsonville',\n",
       "  'city::Spartanburg',\n",
       "  'city::Washington'],\n",
       " 'city+29': ['city::Charleston',\n",
       "  'city::Clive',\n",
       "  'city::Crossville',\n",
       "  'city::Hilo',\n",
       "  'city::Marrero',\n",
       "  'city::Palm Springs North',\n",
       "  'city::Salinas',\n",
       "  'city::Truckee'],\n",
       " 'city+30': ['city::Anaheim',\n",
       "  'city::Atlanta',\n",
       "  'city::Clovis',\n",
       "  'city::East Highland Park',\n",
       "  'city::Essex',\n",
       "  'city::Fresno',\n",
       "  'city::Granite City',\n",
       "  'city::McCook',\n",
       "  'city::New York',\n",
       "  'city::Ogden',\n",
       "  'city::Omaha',\n",
       "  'city::Phenix City',\n",
       "  'city::Pleasant Prairie',\n",
       "  'city::Valrico',\n",
       "  'city::Waveland'],\n",
       " 'city+31': ['city::Calexico', 'city::Eureka'],\n",
       " 'date_local_month+0': ['date_local_month::7', 'date_local_month::12'],\n",
       " 'date_local_month+1': ['date_local_month::5'],\n",
       " 'date_local_month+2': ['date_local_month::6'],\n",
       " 'date_local_month+3': ['date_local_month::9'],\n",
       " 'date_local_month+4': ['date_local_month::4'],\n",
       " 'date_local_month+5': ['date_local_month::11'],\n",
       " 'date_local_month+6': ['date_local_month::2'],\n",
       " 'date_local_month+7': ['date_local_month::3'],\n",
       " 'date_local_month+8': ['date_local_month::10'],\n",
       " 'date_local_month+9': ['date_local_month::8']}"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cluster_groups[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f51cf3a0-d966-4cb3-8aad-b7caec2a538f",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "589eabac-c8af-4a29-b738-5f805d2dc954",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "82ed1812-b347-40d5-b629-e9af49b7e4fd",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d68109a4-bc8c-4827-addb-4e4d11762869",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a39070f0-af7a-4aca-a8a2-a59092e593e6",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
