{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "initial_id",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-05-22T07:41:03.562265Z",
     "start_time": "2024-05-22T07:41:03.559003Z"
    }
   },
   "outputs": [],
   "source": [
    "# Third Party Imports\n",
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from sklearn.metrics import accuracy_score\n",
    "from sklearn.model_selection import train_test_split, RandomizedSearchCV\n",
    "from sklearn.neighbors import KNeighborsClassifier\n",
    "from sklearn.preprocessing import StandardScaler"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "644fbcb1-a948-4036-8fec-6f18369ec046",
   "metadata": {},
   "source": [
    "#### Data Preparation"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bc9ca94d-fd7a-46c5-932d-01ca644994c9",
   "metadata": {},
   "source": [
    "**Reading the Blood Transfusion Dataset**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "77cb6a91a07ed68d",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-05-22T07:41:03.731947Z",
     "start_time": "2024-05-22T07:41:03.723709Z"
    }
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Recency (months)</th>\n",
       "      <th>Frequency (times)</th>\n",
       "      <th>Monetary (c.c. blood)</th>\n",
       "      <th>Time (months)</th>\n",
       "      <th>Blood Donated</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2</td>\n",
       "      <td>50</td>\n",
       "      <td>12500</td>\n",
       "      <td>98</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>13</td>\n",
       "      <td>3250</td>\n",
       "      <td>28</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>16</td>\n",
       "      <td>4000</td>\n",
       "      <td>35</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>20</td>\n",
       "      <td>5000</td>\n",
       "      <td>45</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1</td>\n",
       "      <td>24</td>\n",
       "      <td>6000</td>\n",
       "      <td>77</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Recency (months)  Frequency (times)  Monetary (c.c. blood)  Time (months)  \\\n",
       "0                 2                 50                  12500             98   \n",
       "1                 0                 13                   3250             28   \n",
       "2                 1                 16                   4000             35   \n",
       "3                 2                 20                   5000             45   \n",
       "4                 1                 24                   6000             77   \n",
       "\n",
       "   Blood Donated  \n",
       "0              1  \n",
       "1              1  \n",
       "2              1  \n",
       "3              1  \n",
       "4              0  "
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Reading the Blood Dataset\n",
    "blood = pd.read_csv(\"./../../../datasets/blood/blood.data\")\n",
    "blood.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "317ecda9-87df-40b3-918d-19b7ccd05777",
   "metadata": {},
   "source": [
    "**Print Info and Missing Values**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "1b167864-ced8-46fd-89d8-74266115ab90",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 748 entries, 0 to 747\n",
      "Data columns (total 5 columns):\n",
      " #   Column                 Non-Null Count  Dtype\n",
      "---  ------                 --------------  -----\n",
      " 0   Recency (months)       748 non-null    int64\n",
      " 1   Frequency (times)      748 non-null    int64\n",
      " 2   Monetary (c.c. blood)  748 non-null    int64\n",
      " 3   Time (months)          748 non-null    int64\n",
      " 4   Blood Donated          748 non-null    int64\n",
      "dtypes: int64(5)\n",
      "memory usage: 29.3 KB\n",
      "None\n",
      "\n",
      "\n",
      "\n",
      "Missing values:  False\n"
     ]
    }
   ],
   "source": [
    "print(blood.info())\n",
    "print(\"\\n\\n\")\n",
    "print(\"Missing values: \", blood.isnull().values.any())"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d921143a-172f-4f29-80c6-5a877643d067",
   "metadata": {},
   "source": [
    "**Variance Check**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "948672e3-370b-466e-97ac-be927c47d05f",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Recency (months)              65.535\n",
       "Frequency (times)             34.098\n",
       "Monetary (c.c. blood)    2131094.230\n",
       "Time (months)                594.224\n",
       "Blood Donated                  0.182\n",
       "dtype: float64"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "blood.var().round(3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "a9aaeed7-a7e6-4fac-83fb-213f6b0c3774",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Recency (months)</th>\n",
       "      <th>Frequency (times)</th>\n",
       "      <th>Monetary (c.c. blood)</th>\n",
       "      <th>Time (months)</th>\n",
       "      <th>Blood Donated</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2</td>\n",
       "      <td>50</td>\n",
       "      <td>12500</td>\n",
       "      <td>98</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>13</td>\n",
       "      <td>3250</td>\n",
       "      <td>28</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>16</td>\n",
       "      <td>4000</td>\n",
       "      <td>35</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>20</td>\n",
       "      <td>5000</td>\n",
       "      <td>45</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1</td>\n",
       "      <td>24</td>\n",
       "      <td>6000</td>\n",
       "      <td>77</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Recency (months)  Frequency (times)  Monetary (c.c. blood)  Time (months)  \\\n",
       "0                 2                 50                  12500             98   \n",
       "1                 0                 13                   3250             28   \n",
       "2                 1                 16                   4000             35   \n",
       "3                 2                 20                   5000             45   \n",
       "4                 1                 24                   6000             77   \n",
       "\n",
       "   Blood Donated  \n",
       "0              1  \n",
       "1              1  \n",
       "2              1  \n",
       "3              1  \n",
       "4              0  "
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "blood.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "06776d06-aac3-4cd8-b1e8-b8498381d713",
   "metadata": {},
   "source": [
    "**Checking the distribution of target values**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "339d9bbe-8754-4572-87e1-3365bed7af5e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Blood Donated\n",
       "0    0.762\n",
       "1    0.238\n",
       "Name: proportion, dtype: float64"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "blood[\"Blood Donated\"].value_counts(normalize=True).round(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0ce86e3c-d237-459e-805b-83a02b971354",
   "metadata": {},
   "source": [
    "**Train-Test Split**"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "852899ac-5378-4914-a9e7-c206ded4d0de",
   "metadata": {},
   "source": [
    "Train - Test Split &nbsp;&nbsp;&nbsp;&nbsp; 60%-40%\n",
    "\n",
    "The Test-Set is Further split into Verb And Gen split\n",
    "\n",
    "Verb - Gen Split   &nbsp;&nbsp;&nbsp;&nbsp; 50%-50%"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "bf7ff54f-f3f4-40e6-8bc4-424d99ae8af8",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Train Test Split Stratified on Target Feature\n",
    "X_train, X_test, y_train, y_test = train_test_split(blood.drop(columns=\"Blood Donated\"), blood[\"Blood Donated\"], test_size=0.4, random_state=400, stratify=blood[\"Blood Donated\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "5cc4deea-e333-4ce0-890d-ad1078aac260",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Train Test Split on the Test set to get Verb and Gen Sets. Stratified on the Target Feature\n",
    "X_test_verb, X_test_gen, y_test_verb, y_test_gen = train_test_split(X_test, y_test, test_size=0.5, random_state=400, stratify=y_test)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bda17883-3302-4fc9-8b3b-46c6c669a070",
   "metadata": {},
   "source": [
    "**Checking the distribution target values after the split**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "f79613d4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Blood Donated\n",
      "0    0.761\n",
      "1    0.239\n",
      "Name: proportion, dtype: float64\n",
      "Blood Donated\n",
      "0    0.76\n",
      "1    0.24\n",
      "Name: proportion, dtype: float64\n",
      "Blood Donated\n",
      "0    0.767\n",
      "1    0.233\n",
      "Name: proportion, dtype: float64\n"
     ]
    }
   ],
   "source": [
    "print(y_train.value_counts(normalize=True).round(3))\n",
    "print(y_test_verb.value_counts(normalize=True).round(3))\n",
    "print(y_test_gen.value_counts(normalize=True).round(3))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ccf6c676-335d-4133-afa2-5161bd932f2a",
   "metadata": {},
   "source": [
    "**Variance Check**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "9bf865bb-067e-40f8-bfb8-03afba7c71a1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Recency (months)              71.826\n",
       "Frequency (times)             38.962\n",
       "Monetary (c.c. blood)    2435111.807\n",
       "Time (months)                569.385\n",
       "dtype: float64"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "X_train.var().round(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0a7a2750-30fc-45f5-97d9-9bd0863cab60",
   "metadata": {},
   "source": [
    "**Standardization** - Skipping this because the resulting dataset has very high precision float values (that may not be good for the LLM)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ebbccb2f-d31e-451c-83a4-ba3b35025796",
   "metadata": {},
   "outputs": [],
   "source": [
    "scaler = StandardScaler()\n",
    "X_train_scaled = scaler.fit_transform(X_train)\n",
    "X_test_gen_scaled = scaler.transform(X_test_gen)\n",
    "X_test_verb_scaled = scaler.transform(X_test_verb)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "99cb1c0e-8239-4489-a757-51307bfe7e8a",
   "metadata": {},
   "source": [
    "**Converting them back to dataframes** - No need for this now as there's no standardization"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "563a7aff-a958-42bf-a740-bfe04b397aee",
   "metadata": {},
   "outputs": [],
   "source": [
    "X_train_scaled_df = pd.DataFrame(X_train_scaled, columns=X_train.columns)\n",
    "X_test_gen_scaled_df = pd.DataFrame(X_test_gen_scaled, columns=X_test.columns)\n",
    "X_test_verb_scaled_df = pd.DataFrame(X_test_verb_scaled, columns=X_test.columns)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "d53928be",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Recency (months)         1.00224\n",
       "Frequency (times)        1.00224\n",
       "Monetary (c.c. blood)    1.00224\n",
       "Time (months)            1.00224\n",
       "dtype: float64"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "X_train_scaled_df.var().round(5)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d4ad7b6d-4c4a-47bb-998d-f1b1c7b27c46",
   "metadata": {},
   "source": [
    "Let's expand the dataset. This will preserve the relationship between the data points but since the data is scaled, it'll be easier for the LLM to interpret"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "92893c0c-a9aa-4620-bd7a-fdf3e007561b",
   "metadata": {},
   "outputs": [],
   "source": [
    "expansion_factor = 100\n",
    "X_train_scaled_df = X_train_scaled_df * expansion_factor\n",
    "X_test_verb_scaled_df = X_test_verb_scaled_df * expansion_factor\n",
    "X_test_gen_scaled_df = X_test_gen_scaled_df * expansion_factor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "61360c87-a38f-4ec7-a771-5fe734bb6f79",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Recency (months)         10022.37136\n",
       "Frequency (times)        10022.37136\n",
       "Monetary (c.c. blood)    10022.37136\n",
       "Time (months)            10022.37136\n",
       "dtype: float64"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "X_train_scaled_df.var().round(5)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "97fe3ae9-5bdc-488c-9339-af497d6999ee",
   "metadata": {},
   "source": [
    "From here Onwards `X_test_verb_scaled_df` is going to be `X_test_scaled_df`. `X_test_gen_scaled_df` is not going to be used at all in the code"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "61841898",
   "metadata": {},
   "outputs": [],
   "source": [
    "X_test_scaled_df = X_test_verb_scaled_df\n",
    "y_test = y_test_verb"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8acd2ecf-4e1c-4ff3-9a3f-8f19b5cd7783",
   "metadata": {},
   "source": [
    "#### Helper Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "ffb370a1-50a9-404f-9b85-4f8feeb4bd0f",
   "metadata": {},
   "outputs": [],
   "source": [
    "def nearest_neighbours_plot(knn, X_train, y_train, X_test, y_pred, test_index):\n",
    "    # Select a test instance and print the prediction\n",
    "    test_instance = X_test.iloc[test_index]\n",
    "    \n",
    "    # Find the nearest neighbors\n",
    "    distances, indices = knn.kneighbors([test_instance])\n",
    "    \n",
    "    # Indices 0 and 1 correspond to Recency and Frequency\n",
    "    feature_index_1 = 0\n",
    "    feature_index_2 = 1\n",
    "\n",
    "    # Plot the training data\n",
    "    plt.figure(figsize=(10, 6))\n",
    "    plt.scatter(X_train.iloc[:, feature_index_1], X_train.iloc[:, feature_index_2], c=y_train, cmap='viridis', edgecolor='k')\n",
    "    \n",
    "    # Plot the test instance\n",
    "    plt.scatter(test_instance[feature_index_1], test_instance[feature_index_2], c='r', s=100, marker='*', label='Test Instance')\n",
    "    \n",
    "    # Plot the nearest neighbors\n",
    "    nearest_neighbors = X_train.iloc[indices[0]]\n",
    "    plt.scatter(nearest_neighbors.iloc[:, feature_index_1], nearest_neighbors.iloc[:, feature_index_2], c='g', s=100, label=f'k Nearest Neighbors')\n",
    "    \n",
    "    # Add labels and title\n",
    "    plt.xlabel(X_train.columns[0])\n",
    "    plt.ylabel(X_train.columns[1])\n",
    "    plt.title('Nearest Neighbors Plot')\n",
    "    plt.legend()\n",
    "    \n",
    "    plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8b4f0cd4-3251-4f7a-99d4-d12f4c7bc310",
   "metadata": {},
   "source": [
    "#### Model Variations"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "a4d58829-270b-4e57-a66c-e5af096007e4",
   "metadata": {},
   "source": [
    "**Best Parameter**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "fa0140dc-832a-4916-8844-2fc4a16d5dc1",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/shravan/NLE/Explainable-AI/venv/lib/python3.12/site-packages/numpy/ma/core.py:2846: RuntimeWarning: invalid value encountered in cast\n",
      "  _data = np.array(data, dtype=dtype, copy=copy,\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(151)\n",
    "    \n",
    "param_distributions = {\n",
    "    'n_neighbors': range(1, 10),\n",
    "    'weights': ['uniform', 'distance'],\n",
    "    'algorithm': ['auto', 'brute'],\n",
    "    'leaf_size': range(10, 51),\n",
    "    'p': [1, 2, np.inf],\n",
    "    'metric': ['minkowski', 'cosine']\n",
    "}\n",
    "\n",
    "knn = KNeighborsClassifier()\n",
    "random_search = RandomizedSearchCV(\n",
    "    estimator=knn,\n",
    "    param_distributions=param_distributions,\n",
    "    n_iter=10,\n",
    "    cv=5,\n",
    "    n_jobs=-1,\n",
    "    scoring='accuracy',\n",
    "    random_state=21\n",
    ")\n",
    "\n",
    "random_search.fit(X_train_scaled_df, y_train)\n",
    "best_params = random_search.best_params_"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "6958dd86-d485-4998-b663-9fc11fbdba67",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'weights': 'uniform',\n",
       " 'p': 1,\n",
       " 'n_neighbors': 6,\n",
       " 'metric': 'cosine',\n",
       " 'leaf_size': 17,\n",
       " 'algorithm': 'auto'}"
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "best_params"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "30088431-0576-483c-adef-d0e5900e78de",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.7533333333333333"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Train the base model\n",
    "def train_base_model(X_train, y_train):\n",
    "    # best_knn = KNeighborsClassifier(**best_params)\n",
    "    best_knn = KNeighborsClassifier(metric=\"minkowski\", n_neighbors=5, p=3)\n",
    "    best_knn.fit(X_train, y_train)\n",
    "    return best_knn\n",
    "\n",
    "base_model = train_base_model(X_train_scaled_df, y_train)\n",
    "base_pred = base_model.predict(X_test_scaled_df)\n",
    "accuracy_score(y_test, base_pred)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0ca95e36-e07e-4695-a25c-11affdbe8d24",
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_random_params():\n",
    "    metric = np.random.choice(['minkowski', 'cosine'])\n",
    "    \n",
    "    if metric == 'minkowski':\n",
    "        p_choices = [1, 2, 3, 4, np.inf]\n",
    "        p = np.random.choice(p_choices)\n",
    "        params = {\n",
    "            'n_neighbors': np.random.randint(1, 12),\n",
    "            'weights': np.random.choice(['uniform', 'distance']),\n",
    "            'algorithm': np.random.choice(['auto', 'ball_tree', 'kd_tree', 'brute']),\n",
    "            'leaf_size': np.random.randint(10, 51),\n",
    "            'metric': 'minkowski',\n",
    "            'p': p\n",
    "        }\n",
    "    else:  # cosine similarity\n",
    "        params = {\n",
    "            'n_neighbors': np.random.randint(1, 12),\n",
    "            'weights': np.random.choice(['uniform', 'distance']),\n",
    "            'algorithm': 'brute',\n",
    "            'metric': 'cosine'\n",
    "        }\n",
    "    \n",
    "    return params\n",
    "\n",
    "def compare_models(model1, model2, X):\n",
    "    pred1 = model1.predict(X)\n",
    "    pred2 = model2.predict(X)\n",
    "    diff_percentage = np.mean(pred1 != pred2)\n",
    "    return diff_percentage"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6f5b47dd-fd38-4f95-9846-fee1c83e7eac",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Comparison with Base Model\n",
    "def generate_models_with_diff(base_model, X_train, y_train, X_test, max_attempts=10):\n",
    "    best_diff = 0\n",
    "    best_pair = None\n",
    "    all_models = []\n",
    "    \n",
    "    for i in range(max_attempts):\n",
    "        random_params = generate_random_params()\n",
    "        new_model = KNeighborsClassifier(**random_params)\n",
    "        new_model.fit(X_train, y_train)\n",
    "        all_models.append(new_model)\n",
    "        \n",
    "        diff = compare_models(base_model, new_model, X_test)\n",
    "        print(f\"Attempt Number {i}. Diff - {diff}\")\n",
    "        \n",
    "        if diff > best_diff and (0.20 <= diff and diff <= 0.25):\n",
    "            best_diff = diff\n",
    "            best_pair = (base_model, new_model)\n",
    "            print(f\"Best diff till now {best_diff}.\")\n",
    "    return best_pair, best_diff, all_models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a9c4fc5e-a3c3-4e02-90d5-20d759c5ac89",
   "metadata": {},
   "outputs": [],
   "source": [
    "# np.random.seed(128)\n",
    "# np.random.seed(236)\n",
    "# np.random.seed(264)\n",
    "# np.random.seed(130)\n",
    "# np.random.seed(125)\n",
    "# np.random.seed(400)\n",
    "np.random.seed(440)\n",
    "max_attempts = 50\n",
    "best_pair, best_diff, all_knns = generate_models_with_diff(base_model, X_train_scaled_df, y_train, X_test_scaled_df, max_attempts)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b4de7a2f-1b92-4635-9456-fd625595c80b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def find_best_model_pair(all_models, X_test):\n",
    "    best_pair = None\n",
    "    best_diff = 0\n",
    "    n = len(all_models)\n",
    "    \n",
    "    for i in range(n):\n",
    "        print(f\"ith value is - {i}\")\n",
    "        for j in range(i+1, n):\n",
    "            \n",
    "            model_i = all_models[i]\n",
    "            model_j = all_models[j]\n",
    "            \n",
    "            diff = compare_models(model_i, model_j, X_test)\n",
    "            print(f\"Comparing Model {i} and Model {j}. Diff: {diff:.4f}\")\n",
    "            \n",
    "            if diff > best_diff and (0.20 <= diff and diff <= 0.25):\n",
    "                best_diff = diff\n",
    "                best_pair = (model_i, model_j)\n",
    "                print(\"************************************\")\n",
    "                print(f\"New best pair found: Models {i} and {j} with diff {diff:.4f}\")\n",
    "                print(\"************************************\")\n",
    "               \n",
    "    return best_pair, best_diff"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6e2ccfa6-1437-4cc7-bb4a-570272043034",
   "metadata": {},
   "outputs": [],
   "source": [
    "best_pair, best_diff = find_best_model_pair(all_knns, X_test_scaled_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b00b7592-1329-4ef7-83a3-aaa8658d506b",
   "metadata": {},
   "outputs": [],
   "source": [
    "model1, model2 = best_pair"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9077d3ed-bc11-4ff7-bdb9-82439a985c16",
   "metadata": {},
   "outputs": [],
   "source": [
    "model2, model1 = best_pair"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a7aa62ed-2203-49ab-b6f0-87f6ab2049aa",
   "metadata": {},
   "outputs": [],
   "source": [
    "# let's check the difference on the generation data as well\n",
    "compare_models(model1, model2, X_test_gen_scaled_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dba9bf5b-0b57-4456-ac25-bcccafe00d22",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "9ea03138-8060-44ec-80ba-72d49272ec80",
   "metadata": {},
   "source": [
    "**Evaluate Both Models**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6e595955-68c6-41b3-8b0e-051de7cf86ba",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Evaluate both models\n",
    "y_pred_1 = model1.predict(X_test_scaled_df)\n",
    "y_pred_2 = model2.predict(X_test_scaled_df)\n",
    "\n",
    "accuracy1 = accuracy_score(y_test, y_pred_1)\n",
    "accuracy2 = accuracy_score(y_test, y_pred_2)\n",
    "\n",
    "# Print results\n",
    "print(f\"Model 1\")\n",
    "print(\"Model 1 accuracy:\", accuracy1)\n",
    "print(f\"\\nModel 2:\")\n",
    "print(\"Model 2 accuracy:\", accuracy2)\n",
    "print(\"\\nAccuracy difference:\", abs(accuracy1 - accuracy2))\n",
    "print(f\"\\nPercentage of different outputs: {best_diff:.2%}\")\n",
    "\n",
    "print(\"\\n\\n\")\n",
    "print(model1.get_params())\n",
    "print(model2.get_params())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "170339e7-d051-4934-9bbf-30ae482fd8cf",
   "metadata": {},
   "outputs": [],
   "source": [
    "nearest_neighbours_plot(model1, X_train_scaled_df, y_train, X_test_scaled_df, y_pred_1, 23)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "938c2dc6-cc5a-4492-ae6b-e8e5f2dfb2bf",
   "metadata": {},
   "outputs": [],
   "source": [
    "nearest_neighbours_plot(model2, X_train_scaled_df, y_train, X_test_scaled_df, y_pred_2, 23)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "cd8a30d3-da04-4c7f-953f-a6eec2515698",
   "metadata": {},
   "source": [
    "#### Compare Model Boundaries"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "15fea562-bb74-41a7-a270-87fc65b1fa25",
   "metadata": {},
   "source": [
    "**Plot Model Decision Boundaries**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "80b922f5-4307-452f-90d2-397fc5e969ad",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Function to plot decision boundary\n",
    "def plot_decision_boundary(X_test, y_pred, feature_1, feature_2):\n",
    "    # Create a scatter plot of the predictions\n",
    "    plt.figure(figsize=(8, 6))\n",
    "    plt.scatter(X_test[feature_1], X_test[feature_2], c=y_pred, cmap='rainbow', edgecolor='black', s=20, vmin=0, vmax=1)\n",
    "    \n",
    "    # Add labels and title\n",
    "    plt.xlabel(feature_1)\n",
    "    plt.ylabel(feature_2)\n",
    "    plt.title('KNN Decision Boundary')\n",
    "    \n",
    "    # Add a colorbar to indicate the predicted classes\n",
    "    cbar = plt.colorbar()\n",
    "    cbar.set_ticks([0, 1])\n",
    "    cbar.set_ticklabels([\"No\", \"Yes\"])\n",
    "\n",
    "    plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6d4d70a4-794b-4bc0-8659-d244baa22e7c",
   "metadata": {},
   "source": [
    "**Model 1 Decision Boundary**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "de4db779-ea88-4543-944d-46c15b3e31de",
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_decision_boundary(X_test_scaled_df, y_pred_1, \"Recency (months)\", \"Frequency (times)\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "599fcca1-20b3-4b16-89c4-4fba23c314ce",
   "metadata": {},
   "source": [
    "**Model 2 Decision Boundary**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bff87fe6-d656-416c-88a7-47fd6d503a63",
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_decision_boundary(X_test_scaled_df, y_pred_2, \"Recency (months)\", \"Frequency (times)\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6f04be47-b214-4aa2-a035-57987b4684ae",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "868a325f-d81b-48b4-85a8-5c7f7fc7c201",
   "metadata": {},
   "source": [
    "**Preparing Detailed Data For Ablation Study**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6cbdfedb",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_knn_details(knn_model, X_train, y_train, X_test, for_gen=False):\n",
    "    if not hasattr(knn_model, 'classes_'):\n",
    "        raise ValueError(\"The KNN model is not fitted. Please fit the model before using this function.\")\n",
    "    \n",
    "    # Get the number of neighbors (k) from the model\n",
    "    k = knn_model.n_neighbors\n",
    "    \n",
    "    result = []\n",
    "    \n",
    "    # Loop through each row in the testing dataset\n",
    "    for _, test_row in X_test.iterrows():\n",
    "        distances, indices = knn_model.kneighbors([test_row], n_neighbors=k)\n",
    "        predicted_output = knn_model.predict([test_row])[0]\n",
    "        \n",
    "        nearest_neighbors = []\n",
    "        for distance, index in zip(distances[0], indices[0]):\n",
    "            neighbor_details = {\n",
    "                \"feature_values\": X_train.iloc[index].tolist(),\n",
    "                \"assigned_class\": int(y_train.iloc[index]),\n",
    "                \"distance\": float(distance)\n",
    "            }\n",
    "            nearest_neighbors.append(neighbor_details)\n",
    "        \n",
    "        # Add k random data points if for_gen is True\n",
    "        if for_gen:\n",
    "            random_indices = np.random.choice(len(X_train), k, replace=False)\n",
    "            for index in random_indices:\n",
    "                random_point_details = {\n",
    "                    \"feature_values\": X_train.iloc[index].tolist(),\n",
    "                    \"assigned_class\": int(y_train.iloc[index]),\n",
    "                    \"distance\": None  # Random data points don't have a distance\n",
    "                }\n",
    "                nearest_neighbors.append(random_point_details)\n",
    "        \n",
    "        # Add the details to the result dictionary\n",
    "        result.append({\n",
    "            \"input\": test_row.tolist(),\n",
    "            \"output\": int(predicted_output),\n",
    "            \"nearest_neighbors\": nearest_neighbors\n",
    "        })\n",
    "        \n",
    "    return result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b8dc1f25-f56a-47df-9d75-e364be498870",
   "metadata": {},
   "outputs": [],
   "source": [
    "model1_details_verb = get_knn_details(model1, X_train_scaled_df, y_train, X_test_scaled_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "15784e34-dd83-42e1-b7ae-7f0c61de0a13",
   "metadata": {},
   "outputs": [],
   "source": [
    "model2_details_verb = get_knn_details(model2, X_train_scaled_df, y_train, X_test_scaled_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ffff2030-daf8-439c-8c2f-d759d7d1e9d6",
   "metadata": {},
   "outputs": [],
   "source": [
    "model1_details_gen = get_knn_details(model1, X_train_scaled_df, y_train, X_test_gen_scaled_df, for_gen=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "49d011df-c937-4922-ba06-e6c35182442c",
   "metadata": {},
   "outputs": [],
   "source": [
    "model2_details_gen = get_knn_details(model2, X_train_scaled_df, y_train, X_test_gen_scaled_df, for_gen=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "134416e9-8e03-4c14-bfc5-d08ec5a45df4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def round_values(data, precision=3):\n",
    "    if isinstance(data, list):\n",
    "        return [round_values(item, precision) for item in data]\n",
    "    elif isinstance(data, dict):\n",
    "        return {key: round_values(value, precision) for key, value in data.items()}\n",
    "    elif isinstance(data, (int, float)):\n",
    "        return round(data, precision)\n",
    "    return data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5971118d-84e4-4688-890b-9f570e4666b4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_combined_details(model1_details, model2_details):\n",
    "    combined_details = []\n",
    "    for m1, m2 in zip(model1_details, model2_details):\n",
    "        if m1['input'] == m2['input']:\n",
    "            rounded_input = round_values(m1['input'])\n",
    "            rounded_nn1 = round_values(m1['nearest_neighbors'])\n",
    "            rounded_nn2 = round_values(m2['nearest_neighbors'])\n",
    "\n",
    "            combined_entry = {\n",
    "                \"input\": rounded_input,\n",
    "                \"model1\": {\n",
    "                    \"output\": m1['output'],\n",
    "                    \"nearest_neighbors\": rounded_nn1\n",
    "                },\n",
    "                \"model2\": {\n",
    "                    \"output\": m2['output'],\n",
    "                    \"nearest_neighbors\": rounded_nn2\n",
    "                }\n",
    "            }\n",
    "\n",
    "            combined_details.append(combined_entry)\n",
    "    return combined_details"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a6c2fd97-2cfe-4ae8-a098-07065adb8303",
   "metadata": {},
   "outputs": [],
   "source": [
    "combined_details_verb = get_combined_details(model1_details_verb, model2_details_verb)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b4535fa8-bbbf-48a6-a1f7-fe16d04f0e86",
   "metadata": {},
   "outputs": [],
   "source": [
    "combined_details_gen = get_combined_details(model1_details_gen, model2_details_gen)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "457066ab",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "43a1d4fa-fb39-46e7-8c14-645e213aa7f3",
   "metadata": {},
   "source": [
    "#### Sample Data Creation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a4c67e91-d622-4a73-bedd-f3535c46c5a1",
   "metadata": {},
   "outputs": [],
   "source": [
    "def write_data(data, file_name, varname):\n",
    "    datastr = f\"\\n{varname} = {data}\"\n",
    "    \n",
    "    # Write this string to the file\n",
    "    with open(file_name, 'a') as file:\n",
    "        file.write(datastr)\n",
    "\n",
    "# This stays constant for this iPython file\n",
    "FILE_NAME = \"./../samples/blood/level_3.py\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "166d67f7-55ae-4e56-8ee5-a45649a95bf0",
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"Number of mismatched samples: {np.sum(y_pred_1 != y_pred_2)}\")\n",
    "np.where(y_pred_1 != y_pred_2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "id": "d2ba908c-9ccc-43ed-aebc-34c5e3eeac92",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Number of samples in verb_data: 150\n"
     ]
    }
   ],
   "source": [
    "verb_data = []\n",
    "for idx in range(len(X_test_scaled_df)):\n",
    "    data_point = {\n",
    "        \"input\": round_values(X_test_scaled_df.iloc[idx].to_list()),\n",
    "        \"output\": {\n",
    "            \"model1\": int(y_pred_1[idx]),\n",
    "            \"model2\": int(y_pred_2[idx])\n",
    "        }\n",
    "    }\n",
    "    verb_data.append(data_point)\n",
    "\n",
    "print(f\"Number of samples in verb_data: {len(verb_data)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e4051e96-5b23-4745-9954-d55495df2008",
   "metadata": {},
   "outputs": [],
   "source": [
    "verb_data_second = [{\"input\": i['input'], \"output\": {\"model1\": i[\"model1\"][\"output\"], \"model2\": i[\"model2\"][\"output\"]}} for i in combined_details_verb]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ba2e31c9-b037-4a66-8d9f-b17fd97e02cf",
   "metadata": {},
   "outputs": [],
   "source": [
    "verb_data == verb_data_second"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8444496e-6189-430b-bd90-5ff71426534c",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "97da7c78-ebf8-4ce7-913f-88dc065fcf6e",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ca8a8550-1c56-4a9b-b73a-0d24e3c318fd",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8b0374cf-250d-4b9c-ad17-b30db0b6d8bf",
   "metadata": {},
   "outputs": [],
   "source": [
    "varname = \"verb_data\"\n",
    "data = verb_data\n",
    "write_data(data, FILE_NAME, varname)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "32b9d1e8-7c1a-4839-8b3f-05eea5e03bcc",
   "metadata": {},
   "outputs": [],
   "source": [
    "y_gen_pred_1 = model1.predict(X_test_gen_scaled_df)\n",
    "y_gen_pred_2 = model2.predict(X_test_gen_scaled_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5b11b0a3-deea-4f17-99f7-c992d2b470df",
   "metadata": {},
   "outputs": [],
   "source": [
    "gen_data = []\n",
    "for idx in range(len(X_test_gen_scaled_df)):\n",
    "    data_point = {\n",
    "        \"input\": round_values(X_test_gen_scaled_df.iloc[idx].to_list()),\n",
    "        \"output\": {\n",
    "            \"model1\": int(y_gen_pred_1[idx]),\n",
    "            \"model2\": int(y_gen_pred_2[idx])\n",
    "        }\n",
    "    }\n",
    "    gen_data.append(data_point)\n",
    "\n",
    "print(f\"Number of samples in gen_data: {len(gen_data)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "64268a33-c206-4002-b456-f9ed0d5651dc",
   "metadata": {},
   "outputs": [],
   "source": [
    "varname = \"gen_data\"\n",
    "data = gen_data\n",
    "write_data(data, FILE_NAME, varname)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f132e020-5ee2-4c63-94a1-ab02b41d9a52",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "569c615f-6aaa-42a0-bd78-57f67a13c8fa",
   "metadata": {},
   "outputs": [],
   "source": [
    "def prune_data(gen_data):\n",
    "    return [{\"input\": inst[\"input\"], \"output\": {\"model1\": inst[\"output\"][\"model1\"]}} for inst in gen_data]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ca15745c-cc52-4855-a227-06aef729d537",
   "metadata": {},
   "outputs": [],
   "source": [
    "varname = \"gen_data_pruned\"\n",
    "data = prune_data(gen_data)\n",
    "write_data(data, FILE_NAME, varname)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "39486abe-a340-480f-a7e4-8449c05d372d",
   "metadata": {},
   "outputs": [],
   "source": [
    "def write_structures(structure_text, file_name, varname):\n",
    "    datastr = f\"\\n{varname} = {structure_text}\"\n",
    "    \n",
    "    # write this string to the file\n",
    "    with open(file_name, 'a') as file:\n",
    "        file.write(datastr)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1ffcfa7d-c895-42f0-bee6-dec69c44e339",
   "metadata": {},
   "outputs": [],
   "source": [
    "STRUCTURES_FILE_NAME = \"./../structures/blood/level_3.py\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "59b12448-1adf-43a5-bdad-c3b85be3fcc1",
   "metadata": {},
   "outputs": [],
   "source": [
    "write_structures(combined_details_verb, STRUCTURES_FILE_NAME, \"combined_details_verb\")\n",
    "write_structures(combined_details_gen, STRUCTURES_FILE_NAME, \"combined_details_gen\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3e988969-a87e-42f7-8a5e-d161adb0d32a",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_accuracy(a, b):\n",
    "    correct = 0\n",
    "    total = len(a)\n",
    "    \n",
    "    for i in range(len(a)):\n",
    "        if(a[i]['input'] == b[i]['input']):\n",
    "            if(a[i]['output']['model2'] == b[i]['output']['model2']):\n",
    "                correct += 1\n",
    "        else:\n",
    "            print(\"Mismatch\")\n",
    "            print(a[i])\n",
    "            print(b[i])\n",
    "            print(\"\\n\\n\\n\")\n",
    "    \n",
    "    print(correct)\n",
    "    print(correct/total)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6e2e5462-92f8-43f3-9f15-c39d7a3c2916",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ad485001-fb0e-4ad4-a968-40ce44e0a33c",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "23cd5e81-71ca-405f-a26e-836a19e3fcab",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "432aac87-4b82-4366-8b72-6b1c2951d782",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "79f05dff-21c8-4b96-93ed-534230524c65",
   "metadata": {},
   "outputs": [],
   "source": [
    "def prediction_zero(data):\n",
    "    prediction0_1 = [i for i in range(len(data)) if data[i][\"output\"][\"model1\"] == 0]\n",
    "    prediction0_2 = [i for i in range(len(data)) if data[i][\"output\"][\"model2\"] == 0]\n",
    "    return prediction0_1, prediction0_2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "473a513b-6dea-497a-b710-5345bfb2a264",
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"Model 1: {len(prediction_zero(verb_data)[0])}\")\n",
    "print(f\"Model 2: {len(prediction_zero(verb_data)[1])}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9e6a9ebd-fc67-4823-9f8c-b9e79ec94b4d",
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"Model 1: {len(prediction_zero(gen_data)[0])}\")\n",
    "print(f\"Model 2: {len(prediction_zero(gen_data)[1])}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "067d9623-2ef6-4253-a6a8-515e2ec355a2",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "11eaf5cb-3c36-4760-9e38-21725f728e67",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d9d4cd0b-c7dc-4063-a4bd-c37338661d12",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Function to round data and analyze variance\n",
    "def analyze_precision(df, column, decimal_places):\n",
    "    results = []\n",
    "    for decimals in decimal_places:\n",
    "        df_rounded = df.copy()\n",
    "        df_rounded[column] = df_rounded[column].round(decimals)\n",
    "        variance = df_rounded[column].var()\n",
    "        results.append((decimals, variance))\n",
    "    return pd.DataFrame(results, columns=['Decimals', 'Variance'])\n",
    "\n",
    "# Analyze precision from 0 to 5 decimal places\n",
    "precision_analysis_1 = analyze_precision(X_train_scaled_df, 'Recency (months)', range(7))\n",
    "precision_analysis_2 = analyze_precision(X_train_scaled_df, 'Frequency (times)', range(7))\n",
    "precision_analysis_3 = analyze_precision(X_train_scaled_df, 'Monetary (c.c. blood)', range(7))\n",
    "precision_analysis_4 = analyze_precision(X_train_scaled_df, 'Time (months)', range(7))\n",
    "\n",
    "print(precision_analysis_1)\n",
    "print(precision_analysis_2)\n",
    "print(precision_analysis_3)\n",
    "print(precision_analysis_4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "898835e4-cd64-4c6b-854d-16acb0ffd8b7",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9806ca77",
   "metadata": {},
   "outputs": [],
   "source": [
    "mismatches = [i for i in gen_data if i[\"output\"][\"model1\"] != i[\"output\"][\"model2\"]]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1af5df0f-de07-4c56-89c0-dcdbb5b578cb",
   "metadata": {},
   "outputs": [],
   "source": [
    "mismatches"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ed9c4c85-ad54-4717-b43f-a99bf0fb4e73",
   "metadata": {},
   "outputs": [],
   "source": [
    "len(mismatches)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0fb156d4-9804-454a-a9d9-8c4d8a11ef13",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3d0d8f47-a535-4bf5-a695-094a683eea07",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "id": "367c80af-5835-471c-8a34-215670a67db2",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<style>#sk-container-id-11 {\n",
       "  /* Definition of color scheme common for light and dark mode */\n",
       "  --sklearn-color-text: black;\n",
       "  --sklearn-color-line: gray;\n",
       "  /* Definition of color scheme for unfitted estimators */\n",
       "  --sklearn-color-unfitted-level-0: #fff5e6;\n",
       "  --sklearn-color-unfitted-level-1: #f6e4d2;\n",
       "  --sklearn-color-unfitted-level-2: #ffe0b3;\n",
       "  --sklearn-color-unfitted-level-3: chocolate;\n",
       "  /* Definition of color scheme for fitted estimators */\n",
       "  --sklearn-color-fitted-level-0: #f0f8ff;\n",
       "  --sklearn-color-fitted-level-1: #d4ebff;\n",
       "  --sklearn-color-fitted-level-2: #b3dbfd;\n",
       "  --sklearn-color-fitted-level-3: cornflowerblue;\n",
       "\n",
       "  /* Specific color for light theme */\n",
       "  --sklearn-color-text-on-default-background: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, black)));\n",
       "  --sklearn-color-background: var(--sg-background-color, var(--theme-background, var(--jp-layout-color0, white)));\n",
       "  --sklearn-color-border-box: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, black)));\n",
       "  --sklearn-color-icon: #696969;\n",
       "\n",
       "  @media (prefers-color-scheme: dark) {\n",
       "    /* Redefinition of color scheme for dark theme */\n",
       "    --sklearn-color-text-on-default-background: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, white)));\n",
       "    --sklearn-color-background: var(--sg-background-color, var(--theme-background, var(--jp-layout-color0, #111)));\n",
       "    --sklearn-color-border-box: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, white)));\n",
       "    --sklearn-color-icon: #878787;\n",
       "  }\n",
       "}\n",
       "\n",
       "#sk-container-id-11 {\n",
       "  color: var(--sklearn-color-text);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 pre {\n",
       "  padding: 0;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 input.sk-hidden--visually {\n",
       "  border: 0;\n",
       "  clip: rect(1px 1px 1px 1px);\n",
       "  clip: rect(1px, 1px, 1px, 1px);\n",
       "  height: 1px;\n",
       "  margin: -1px;\n",
       "  overflow: hidden;\n",
       "  padding: 0;\n",
       "  position: absolute;\n",
       "  width: 1px;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-dashed-wrapped {\n",
       "  border: 1px dashed var(--sklearn-color-line);\n",
       "  margin: 0 0.4em 0.5em 0.4em;\n",
       "  box-sizing: border-box;\n",
       "  padding-bottom: 0.4em;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-container {\n",
       "  /* jupyter's `normalize.less` sets `[hidden] { display: none; }`\n",
       "     but bootstrap.min.css set `[hidden] { display: none !important; }`\n",
       "     so we also need the `!important` here to be able to override the\n",
       "     default hidden behavior on the sphinx rendered scikit-learn.org.\n",
       "     See: https://github.com/scikit-learn/scikit-learn/issues/21755 */\n",
       "  display: inline-block !important;\n",
       "  position: relative;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-text-repr-fallback {\n",
       "  display: none;\n",
       "}\n",
       "\n",
       "div.sk-parallel-item,\n",
       "div.sk-serial,\n",
       "div.sk-item {\n",
       "  /* draw centered vertical line to link estimators */\n",
       "  background-image: linear-gradient(var(--sklearn-color-text-on-default-background), var(--sklearn-color-text-on-default-background));\n",
       "  background-size: 2px 100%;\n",
       "  background-repeat: no-repeat;\n",
       "  background-position: center center;\n",
       "}\n",
       "\n",
       "/* Parallel-specific style estimator block */\n",
       "\n",
       "#sk-container-id-11 div.sk-parallel-item::after {\n",
       "  content: \"\";\n",
       "  width: 100%;\n",
       "  border-bottom: 2px solid var(--sklearn-color-text-on-default-background);\n",
       "  flex-grow: 1;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-parallel {\n",
       "  display: flex;\n",
       "  align-items: stretch;\n",
       "  justify-content: center;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  position: relative;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-parallel-item {\n",
       "  display: flex;\n",
       "  flex-direction: column;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-parallel-item:first-child::after {\n",
       "  align-self: flex-end;\n",
       "  width: 50%;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-parallel-item:last-child::after {\n",
       "  align-self: flex-start;\n",
       "  width: 50%;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-parallel-item:only-child::after {\n",
       "  width: 0;\n",
       "}\n",
       "\n",
       "/* Serial-specific style estimator block */\n",
       "\n",
       "#sk-container-id-11 div.sk-serial {\n",
       "  display: flex;\n",
       "  flex-direction: column;\n",
       "  align-items: center;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  padding-right: 1em;\n",
       "  padding-left: 1em;\n",
       "}\n",
       "\n",
       "\n",
       "/* Toggleable style: style used for estimator/Pipeline/ColumnTransformer box that is\n",
       "clickable and can be expanded/collapsed.\n",
       "- Pipeline and ColumnTransformer use this feature and define the default style\n",
       "- Estimators will overwrite some part of the style using the `sk-estimator` class\n",
       "*/\n",
       "\n",
       "/* Pipeline and ColumnTransformer style (default) */\n",
       "\n",
       "#sk-container-id-11 div.sk-toggleable {\n",
       "  /* Default theme specific background. It is overwritten whether we have a\n",
       "  specific estimator or a Pipeline/ColumnTransformer */\n",
       "  background-color: var(--sklearn-color-background);\n",
       "}\n",
       "\n",
       "/* Toggleable label */\n",
       "#sk-container-id-11 label.sk-toggleable__label {\n",
       "  cursor: pointer;\n",
       "  display: block;\n",
       "  width: 100%;\n",
       "  margin-bottom: 0;\n",
       "  padding: 0.5em;\n",
       "  box-sizing: border-box;\n",
       "  text-align: center;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 label.sk-toggleable__label-arrow:before {\n",
       "  /* Arrow on the left of the label */\n",
       "  content: \"▸\";\n",
       "  float: left;\n",
       "  margin-right: 0.25em;\n",
       "  color: var(--sklearn-color-icon);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 label.sk-toggleable__label-arrow:hover:before {\n",
       "  color: var(--sklearn-color-text);\n",
       "}\n",
       "\n",
       "/* Toggleable content - dropdown */\n",
       "\n",
       "#sk-container-id-11 div.sk-toggleable__content {\n",
       "  max-height: 0;\n",
       "  max-width: 0;\n",
       "  overflow: hidden;\n",
       "  text-align: left;\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-toggleable__content.fitted {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-toggleable__content pre {\n",
       "  margin: 0.2em;\n",
       "  border-radius: 0.25em;\n",
       "  color: var(--sklearn-color-text);\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-toggleable__content.fitted pre {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 input.sk-toggleable__control:checked~div.sk-toggleable__content {\n",
       "  /* Expand drop-down */\n",
       "  max-height: 200px;\n",
       "  max-width: 100%;\n",
       "  overflow: auto;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {\n",
       "  content: \"▾\";\n",
       "}\n",
       "\n",
       "/* Pipeline/ColumnTransformer-specific style */\n",
       "\n",
       "#sk-container-id-11 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  color: var(--sklearn-color-text);\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-label.fitted input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "/* Estimator-specific style */\n",
       "\n",
       "/* Colorize estimator box */\n",
       "#sk-container-id-11 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-estimator.fitted input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-label label.sk-toggleable__label,\n",
       "#sk-container-id-11 div.sk-label label {\n",
       "  /* The background is the default theme color */\n",
       "  color: var(--sklearn-color-text-on-default-background);\n",
       "}\n",
       "\n",
       "/* On hover, darken the color of the background */\n",
       "#sk-container-id-11 div.sk-label:hover label.sk-toggleable__label {\n",
       "  color: var(--sklearn-color-text);\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "/* Label box, darken color on hover, fitted */\n",
       "#sk-container-id-11 div.sk-label.fitted:hover label.sk-toggleable__label.fitted {\n",
       "  color: var(--sklearn-color-text);\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "/* Estimator label */\n",
       "\n",
       "#sk-container-id-11 div.sk-label label {\n",
       "  font-family: monospace;\n",
       "  font-weight: bold;\n",
       "  display: inline-block;\n",
       "  line-height: 1.2em;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-label-container {\n",
       "  text-align: center;\n",
       "}\n",
       "\n",
       "/* Estimator-specific */\n",
       "#sk-container-id-11 div.sk-estimator {\n",
       "  font-family: monospace;\n",
       "  border: 1px dotted var(--sklearn-color-border-box);\n",
       "  border-radius: 0.25em;\n",
       "  box-sizing: border-box;\n",
       "  margin-bottom: 0.5em;\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-estimator.fitted {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-0);\n",
       "}\n",
       "\n",
       "/* on hover */\n",
       "#sk-container-id-11 div.sk-estimator:hover {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-11 div.sk-estimator.fitted:hover {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "/* Specification for estimator info (e.g. \"i\" and \"?\") */\n",
       "\n",
       "/* Common style for \"i\" and \"?\" */\n",
       "\n",
       ".sk-estimator-doc-link,\n",
       "a:link.sk-estimator-doc-link,\n",
       "a:visited.sk-estimator-doc-link {\n",
       "  float: right;\n",
       "  font-size: smaller;\n",
       "  line-height: 1em;\n",
       "  font-family: monospace;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  border-radius: 1em;\n",
       "  height: 1em;\n",
       "  width: 1em;\n",
       "  text-decoration: none !important;\n",
       "  margin-left: 1ex;\n",
       "  /* unfitted */\n",
       "  border: var(--sklearn-color-unfitted-level-1) 1pt solid;\n",
       "  color: var(--sklearn-color-unfitted-level-1);\n",
       "}\n",
       "\n",
       ".sk-estimator-doc-link.fitted,\n",
       "a:link.sk-estimator-doc-link.fitted,\n",
       "a:visited.sk-estimator-doc-link.fitted {\n",
       "  /* fitted */\n",
       "  border: var(--sklearn-color-fitted-level-1) 1pt solid;\n",
       "  color: var(--sklearn-color-fitted-level-1);\n",
       "}\n",
       "\n",
       "/* On hover */\n",
       "div.sk-estimator:hover .sk-estimator-doc-link:hover,\n",
       ".sk-estimator-doc-link:hover,\n",
       "div.sk-label-container:hover .sk-estimator-doc-link:hover,\n",
       ".sk-estimator-doc-link:hover {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-3);\n",
       "  color: var(--sklearn-color-background);\n",
       "  text-decoration: none;\n",
       "}\n",
       "\n",
       "div.sk-estimator.fitted:hover .sk-estimator-doc-link.fitted:hover,\n",
       ".sk-estimator-doc-link.fitted:hover,\n",
       "div.sk-label-container:hover .sk-estimator-doc-link.fitted:hover,\n",
       ".sk-estimator-doc-link.fitted:hover {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-3);\n",
       "  color: var(--sklearn-color-background);\n",
       "  text-decoration: none;\n",
       "}\n",
       "\n",
       "/* Span, style for the box shown on hovering the info icon */\n",
       ".sk-estimator-doc-link span {\n",
       "  display: none;\n",
       "  z-index: 9999;\n",
       "  position: relative;\n",
       "  font-weight: normal;\n",
       "  right: .2ex;\n",
       "  padding: .5ex;\n",
       "  margin: .5ex;\n",
       "  width: min-content;\n",
       "  min-width: 20ex;\n",
       "  max-width: 50ex;\n",
       "  color: var(--sklearn-color-text);\n",
       "  box-shadow: 2pt 2pt 4pt #999;\n",
       "  /* unfitted */\n",
       "  background: var(--sklearn-color-unfitted-level-0);\n",
       "  border: .5pt solid var(--sklearn-color-unfitted-level-3);\n",
       "}\n",
       "\n",
       ".sk-estimator-doc-link.fitted span {\n",
       "  /* fitted */\n",
       "  background: var(--sklearn-color-fitted-level-0);\n",
       "  border: var(--sklearn-color-fitted-level-3);\n",
       "}\n",
       "\n",
       ".sk-estimator-doc-link:hover span {\n",
       "  display: block;\n",
       "}\n",
       "\n",
       "/* \"?\"-specific style due to the `<a>` HTML tag */\n",
       "\n",
       "#sk-container-id-11 a.estimator_doc_link {\n",
       "  float: right;\n",
       "  font-size: 1rem;\n",
       "  line-height: 1em;\n",
       "  font-family: monospace;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  border-radius: 1rem;\n",
       "  height: 1rem;\n",
       "  width: 1rem;\n",
       "  text-decoration: none;\n",
       "  /* unfitted */\n",
       "  color: var(--sklearn-color-unfitted-level-1);\n",
       "  border: var(--sklearn-color-unfitted-level-1) 1pt solid;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 a.estimator_doc_link.fitted {\n",
       "  /* fitted */\n",
       "  border: var(--sklearn-color-fitted-level-1) 1pt solid;\n",
       "  color: var(--sklearn-color-fitted-level-1);\n",
       "}\n",
       "\n",
       "/* On hover */\n",
       "#sk-container-id-11 a.estimator_doc_link:hover {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-3);\n",
       "  color: var(--sklearn-color-background);\n",
       "  text-decoration: none;\n",
       "}\n",
       "\n",
       "#sk-container-id-11 a.estimator_doc_link.fitted:hover {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-3);\n",
       "}\n",
       "</style><div id=\"sk-container-id-11\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>KNeighborsClassifier(algorithm=np.str_(&#x27;brute&#x27;), leaf_size=19, n_neighbors=1,\n",
       "                     p=np.float64(inf), weights=np.str_(&#x27;distance&#x27;))</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator fitted sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-11\" type=\"checkbox\" checked><label for=\"sk-estimator-id-11\" class=\"sk-toggleable__label fitted sk-toggleable__label-arrow fitted\">&nbsp;&nbsp;KNeighborsClassifier<a class=\"sk-estimator-doc-link fitted\" rel=\"noreferrer\" target=\"_blank\" href=\"https://scikit-learn.org/1.5/modules/generated/sklearn.neighbors.KNeighborsClassifier.html\">?<span>Documentation for KNeighborsClassifier</span></a><span class=\"sk-estimator-doc-link fitted\">i<span>Fitted</span></span></label><div class=\"sk-toggleable__content fitted\"><pre>KNeighborsClassifier(algorithm=np.str_(&#x27;brute&#x27;), leaf_size=19, n_neighbors=1,\n",
       "                     p=np.float64(inf), weights=np.str_(&#x27;distance&#x27;))</pre></div> </div></div></div></div>"
      ],
      "text/plain": [
       "KNeighborsClassifier(algorithm=np.str_('brute'), leaf_size=19, n_neighbors=1,\n",
       "                     p=np.float64(inf), weights=np.str_('distance'))"
      ]
     },
     "execution_count": 64,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model1 = KNeighborsClassifier(algorithm=np.str_('brute'), leaf_size=19, metric='minkowski', metric_params=None, n_jobs=None, n_neighbors=1, p=np.float64(np.inf), weights=np.str_('distance'))\n",
    "model1.fit(X_train_scaled_df, y_train)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "id": "96019376-c72e-4796-ac5c-6c5cee450b82",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<style>#sk-container-id-12 {\n",
       "  /* Definition of color scheme common for light and dark mode */\n",
       "  --sklearn-color-text: black;\n",
       "  --sklearn-color-line: gray;\n",
       "  /* Definition of color scheme for unfitted estimators */\n",
       "  --sklearn-color-unfitted-level-0: #fff5e6;\n",
       "  --sklearn-color-unfitted-level-1: #f6e4d2;\n",
       "  --sklearn-color-unfitted-level-2: #ffe0b3;\n",
       "  --sklearn-color-unfitted-level-3: chocolate;\n",
       "  /* Definition of color scheme for fitted estimators */\n",
       "  --sklearn-color-fitted-level-0: #f0f8ff;\n",
       "  --sklearn-color-fitted-level-1: #d4ebff;\n",
       "  --sklearn-color-fitted-level-2: #b3dbfd;\n",
       "  --sklearn-color-fitted-level-3: cornflowerblue;\n",
       "\n",
       "  /* Specific color for light theme */\n",
       "  --sklearn-color-text-on-default-background: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, black)));\n",
       "  --sklearn-color-background: var(--sg-background-color, var(--theme-background, var(--jp-layout-color0, white)));\n",
       "  --sklearn-color-border-box: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, black)));\n",
       "  --sklearn-color-icon: #696969;\n",
       "\n",
       "  @media (prefers-color-scheme: dark) {\n",
       "    /* Redefinition of color scheme for dark theme */\n",
       "    --sklearn-color-text-on-default-background: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, white)));\n",
       "    --sklearn-color-background: var(--sg-background-color, var(--theme-background, var(--jp-layout-color0, #111)));\n",
       "    --sklearn-color-border-box: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, white)));\n",
       "    --sklearn-color-icon: #878787;\n",
       "  }\n",
       "}\n",
       "\n",
       "#sk-container-id-12 {\n",
       "  color: var(--sklearn-color-text);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 pre {\n",
       "  padding: 0;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 input.sk-hidden--visually {\n",
       "  border: 0;\n",
       "  clip: rect(1px 1px 1px 1px);\n",
       "  clip: rect(1px, 1px, 1px, 1px);\n",
       "  height: 1px;\n",
       "  margin: -1px;\n",
       "  overflow: hidden;\n",
       "  padding: 0;\n",
       "  position: absolute;\n",
       "  width: 1px;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-dashed-wrapped {\n",
       "  border: 1px dashed var(--sklearn-color-line);\n",
       "  margin: 0 0.4em 0.5em 0.4em;\n",
       "  box-sizing: border-box;\n",
       "  padding-bottom: 0.4em;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-container {\n",
       "  /* jupyter's `normalize.less` sets `[hidden] { display: none; }`\n",
       "     but bootstrap.min.css set `[hidden] { display: none !important; }`\n",
       "     so we also need the `!important` here to be able to override the\n",
       "     default hidden behavior on the sphinx rendered scikit-learn.org.\n",
       "     See: https://github.com/scikit-learn/scikit-learn/issues/21755 */\n",
       "  display: inline-block !important;\n",
       "  position: relative;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-text-repr-fallback {\n",
       "  display: none;\n",
       "}\n",
       "\n",
       "div.sk-parallel-item,\n",
       "div.sk-serial,\n",
       "div.sk-item {\n",
       "  /* draw centered vertical line to link estimators */\n",
       "  background-image: linear-gradient(var(--sklearn-color-text-on-default-background), var(--sklearn-color-text-on-default-background));\n",
       "  background-size: 2px 100%;\n",
       "  background-repeat: no-repeat;\n",
       "  background-position: center center;\n",
       "}\n",
       "\n",
       "/* Parallel-specific style estimator block */\n",
       "\n",
       "#sk-container-id-12 div.sk-parallel-item::after {\n",
       "  content: \"\";\n",
       "  width: 100%;\n",
       "  border-bottom: 2px solid var(--sklearn-color-text-on-default-background);\n",
       "  flex-grow: 1;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-parallel {\n",
       "  display: flex;\n",
       "  align-items: stretch;\n",
       "  justify-content: center;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  position: relative;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-parallel-item {\n",
       "  display: flex;\n",
       "  flex-direction: column;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-parallel-item:first-child::after {\n",
       "  align-self: flex-end;\n",
       "  width: 50%;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-parallel-item:last-child::after {\n",
       "  align-self: flex-start;\n",
       "  width: 50%;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-parallel-item:only-child::after {\n",
       "  width: 0;\n",
       "}\n",
       "\n",
       "/* Serial-specific style estimator block */\n",
       "\n",
       "#sk-container-id-12 div.sk-serial {\n",
       "  display: flex;\n",
       "  flex-direction: column;\n",
       "  align-items: center;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  padding-right: 1em;\n",
       "  padding-left: 1em;\n",
       "}\n",
       "\n",
       "\n",
       "/* Toggleable style: style used for estimator/Pipeline/ColumnTransformer box that is\n",
       "clickable and can be expanded/collapsed.\n",
       "- Pipeline and ColumnTransformer use this feature and define the default style\n",
       "- Estimators will overwrite some part of the style using the `sk-estimator` class\n",
       "*/\n",
       "\n",
       "/* Pipeline and ColumnTransformer style (default) */\n",
       "\n",
       "#sk-container-id-12 div.sk-toggleable {\n",
       "  /* Default theme specific background. It is overwritten whether we have a\n",
       "  specific estimator or a Pipeline/ColumnTransformer */\n",
       "  background-color: var(--sklearn-color-background);\n",
       "}\n",
       "\n",
       "/* Toggleable label */\n",
       "#sk-container-id-12 label.sk-toggleable__label {\n",
       "  cursor: pointer;\n",
       "  display: block;\n",
       "  width: 100%;\n",
       "  margin-bottom: 0;\n",
       "  padding: 0.5em;\n",
       "  box-sizing: border-box;\n",
       "  text-align: center;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 label.sk-toggleable__label-arrow:before {\n",
       "  /* Arrow on the left of the label */\n",
       "  content: \"▸\";\n",
       "  float: left;\n",
       "  margin-right: 0.25em;\n",
       "  color: var(--sklearn-color-icon);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 label.sk-toggleable__label-arrow:hover:before {\n",
       "  color: var(--sklearn-color-text);\n",
       "}\n",
       "\n",
       "/* Toggleable content - dropdown */\n",
       "\n",
       "#sk-container-id-12 div.sk-toggleable__content {\n",
       "  max-height: 0;\n",
       "  max-width: 0;\n",
       "  overflow: hidden;\n",
       "  text-align: left;\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-toggleable__content.fitted {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-toggleable__content pre {\n",
       "  margin: 0.2em;\n",
       "  border-radius: 0.25em;\n",
       "  color: var(--sklearn-color-text);\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-toggleable__content.fitted pre {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 input.sk-toggleable__control:checked~div.sk-toggleable__content {\n",
       "  /* Expand drop-down */\n",
       "  max-height: 200px;\n",
       "  max-width: 100%;\n",
       "  overflow: auto;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {\n",
       "  content: \"▾\";\n",
       "}\n",
       "\n",
       "/* Pipeline/ColumnTransformer-specific style */\n",
       "\n",
       "#sk-container-id-12 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  color: var(--sklearn-color-text);\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-label.fitted input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "/* Estimator-specific style */\n",
       "\n",
       "/* Colorize estimator box */\n",
       "#sk-container-id-12 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-estimator.fitted input.sk-toggleable__control:checked~label.sk-toggleable__label {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-label label.sk-toggleable__label,\n",
       "#sk-container-id-12 div.sk-label label {\n",
       "  /* The background is the default theme color */\n",
       "  color: var(--sklearn-color-text-on-default-background);\n",
       "}\n",
       "\n",
       "/* On hover, darken the color of the background */\n",
       "#sk-container-id-12 div.sk-label:hover label.sk-toggleable__label {\n",
       "  color: var(--sklearn-color-text);\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "/* Label box, darken color on hover, fitted */\n",
       "#sk-container-id-12 div.sk-label.fitted:hover label.sk-toggleable__label.fitted {\n",
       "  color: var(--sklearn-color-text);\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "/* Estimator label */\n",
       "\n",
       "#sk-container-id-12 div.sk-label label {\n",
       "  font-family: monospace;\n",
       "  font-weight: bold;\n",
       "  display: inline-block;\n",
       "  line-height: 1.2em;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-label-container {\n",
       "  text-align: center;\n",
       "}\n",
       "\n",
       "/* Estimator-specific */\n",
       "#sk-container-id-12 div.sk-estimator {\n",
       "  font-family: monospace;\n",
       "  border: 1px dotted var(--sklearn-color-border-box);\n",
       "  border-radius: 0.25em;\n",
       "  box-sizing: border-box;\n",
       "  margin-bottom: 0.5em;\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-0);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-estimator.fitted {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-0);\n",
       "}\n",
       "\n",
       "/* on hover */\n",
       "#sk-container-id-12 div.sk-estimator:hover {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-2);\n",
       "}\n",
       "\n",
       "#sk-container-id-12 div.sk-estimator.fitted:hover {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-2);\n",
       "}\n",
       "\n",
       "/* Specification for estimator info (e.g. \"i\" and \"?\") */\n",
       "\n",
       "/* Common style for \"i\" and \"?\" */\n",
       "\n",
       ".sk-estimator-doc-link,\n",
       "a:link.sk-estimator-doc-link,\n",
       "a:visited.sk-estimator-doc-link {\n",
       "  float: right;\n",
       "  font-size: smaller;\n",
       "  line-height: 1em;\n",
       "  font-family: monospace;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  border-radius: 1em;\n",
       "  height: 1em;\n",
       "  width: 1em;\n",
       "  text-decoration: none !important;\n",
       "  margin-left: 1ex;\n",
       "  /* unfitted */\n",
       "  border: var(--sklearn-color-unfitted-level-1) 1pt solid;\n",
       "  color: var(--sklearn-color-unfitted-level-1);\n",
       "}\n",
       "\n",
       ".sk-estimator-doc-link.fitted,\n",
       "a:link.sk-estimator-doc-link.fitted,\n",
       "a:visited.sk-estimator-doc-link.fitted {\n",
       "  /* fitted */\n",
       "  border: var(--sklearn-color-fitted-level-1) 1pt solid;\n",
       "  color: var(--sklearn-color-fitted-level-1);\n",
       "}\n",
       "\n",
       "/* On hover */\n",
       "div.sk-estimator:hover .sk-estimator-doc-link:hover,\n",
       ".sk-estimator-doc-link:hover,\n",
       "div.sk-label-container:hover .sk-estimator-doc-link:hover,\n",
       ".sk-estimator-doc-link:hover {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-3);\n",
       "  color: var(--sklearn-color-background);\n",
       "  text-decoration: none;\n",
       "}\n",
       "\n",
       "div.sk-estimator.fitted:hover .sk-estimator-doc-link.fitted:hover,\n",
       ".sk-estimator-doc-link.fitted:hover,\n",
       "div.sk-label-container:hover .sk-estimator-doc-link.fitted:hover,\n",
       ".sk-estimator-doc-link.fitted:hover {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-3);\n",
       "  color: var(--sklearn-color-background);\n",
       "  text-decoration: none;\n",
       "}\n",
       "\n",
       "/* Span, style for the box shown on hovering the info icon */\n",
       ".sk-estimator-doc-link span {\n",
       "  display: none;\n",
       "  z-index: 9999;\n",
       "  position: relative;\n",
       "  font-weight: normal;\n",
       "  right: .2ex;\n",
       "  padding: .5ex;\n",
       "  margin: .5ex;\n",
       "  width: min-content;\n",
       "  min-width: 20ex;\n",
       "  max-width: 50ex;\n",
       "  color: var(--sklearn-color-text);\n",
       "  box-shadow: 2pt 2pt 4pt #999;\n",
       "  /* unfitted */\n",
       "  background: var(--sklearn-color-unfitted-level-0);\n",
       "  border: .5pt solid var(--sklearn-color-unfitted-level-3);\n",
       "}\n",
       "\n",
       ".sk-estimator-doc-link.fitted span {\n",
       "  /* fitted */\n",
       "  background: var(--sklearn-color-fitted-level-0);\n",
       "  border: var(--sklearn-color-fitted-level-3);\n",
       "}\n",
       "\n",
       ".sk-estimator-doc-link:hover span {\n",
       "  display: block;\n",
       "}\n",
       "\n",
       "/* \"?\"-specific style due to the `<a>` HTML tag */\n",
       "\n",
       "#sk-container-id-12 a.estimator_doc_link {\n",
       "  float: right;\n",
       "  font-size: 1rem;\n",
       "  line-height: 1em;\n",
       "  font-family: monospace;\n",
       "  background-color: var(--sklearn-color-background);\n",
       "  border-radius: 1rem;\n",
       "  height: 1rem;\n",
       "  width: 1rem;\n",
       "  text-decoration: none;\n",
       "  /* unfitted */\n",
       "  color: var(--sklearn-color-unfitted-level-1);\n",
       "  border: var(--sklearn-color-unfitted-level-1) 1pt solid;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 a.estimator_doc_link.fitted {\n",
       "  /* fitted */\n",
       "  border: var(--sklearn-color-fitted-level-1) 1pt solid;\n",
       "  color: var(--sklearn-color-fitted-level-1);\n",
       "}\n",
       "\n",
       "/* On hover */\n",
       "#sk-container-id-12 a.estimator_doc_link:hover {\n",
       "  /* unfitted */\n",
       "  background-color: var(--sklearn-color-unfitted-level-3);\n",
       "  color: var(--sklearn-color-background);\n",
       "  text-decoration: none;\n",
       "}\n",
       "\n",
       "#sk-container-id-12 a.estimator_doc_link.fitted:hover {\n",
       "  /* fitted */\n",
       "  background-color: var(--sklearn-color-fitted-level-3);\n",
       "}\n",
       "</style><div id=\"sk-container-id-12\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>KNeighborsClassifier(p=3)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator fitted sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-12\" type=\"checkbox\" checked><label for=\"sk-estimator-id-12\" class=\"sk-toggleable__label fitted sk-toggleable__label-arrow fitted\">&nbsp;&nbsp;KNeighborsClassifier<a class=\"sk-estimator-doc-link fitted\" rel=\"noreferrer\" target=\"_blank\" href=\"https://scikit-learn.org/1.5/modules/generated/sklearn.neighbors.KNeighborsClassifier.html\">?<span>Documentation for KNeighborsClassifier</span></a><span class=\"sk-estimator-doc-link fitted\">i<span>Fitted</span></span></label><div class=\"sk-toggleable__content fitted\"><pre>KNeighborsClassifier(p=3)</pre></div> </div></div></div></div>"
      ],
      "text/plain": [
       "KNeighborsClassifier(p=3)"
      ]
     },
     "execution_count": 65,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model2 = KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski', metric_params=None, n_jobs=None, n_neighbors=5, p=3, weights='uniform')\n",
    "model2.fit(X_train_scaled_df, y_train)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "id": "94ed0313-9bd5-4776-9027-d4fc7df3791b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Model 1\n",
      "Model 1 accuracy: 0.64\n",
      "\n",
      "Model 2:\n",
      "Model 2 accuracy: 0.7533333333333333\n",
      "\n",
      "Accuracy difference: 0.11333333333333329\n",
      "\n",
      "\n",
      "\n",
      "{'algorithm': np.str_('brute'), 'leaf_size': 19, 'metric': 'minkowski', 'metric_params': None, 'n_jobs': None, 'n_neighbors': 1, 'p': np.float64(inf), 'weights': np.str_('distance')}\n",
      "{'algorithm': 'auto', 'leaf_size': 30, 'metric': 'minkowski', 'metric_params': None, 'n_jobs': None, 'n_neighbors': 5, 'p': 3, 'weights': 'uniform'}\n"
     ]
    }
   ],
   "source": [
    "# Evaluate both models\n",
    "y_pred_1 = model1.predict(X_test_scaled_df)\n",
    "y_pred_2 = model2.predict(X_test_scaled_df)\n",
    "\n",
    "accuracy1 = accuracy_score(y_test, y_pred_1)\n",
    "accuracy2 = accuracy_score(y_test, y_pred_2)\n",
    "\n",
    "# Print results\n",
    "print(f\"Model 1\")\n",
    "print(\"Model 1 accuracy:\", accuracy1)\n",
    "print(f\"\\nModel 2:\")\n",
    "print(\"Model 2 accuracy:\", accuracy2)\n",
    "print(\"\\nAccuracy difference:\", abs(accuracy1 - accuracy2))\n",
    "# print(f\"\\nPercentage of different outputs: {best_diff:.2%}\")\n",
    "\n",
    "print(\"\\n\\n\")\n",
    "print(model1.get_params())\n",
    "print(model2.get_params())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d3738abe-306e-43b3-b0c5-ac0f66ba6071",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "1948628d-62a8-44b9-b2c7-50b97f810d32",
   "metadata": {},
   "outputs": [],
   "source": [
    "verb_data1 = [{'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 67.376, 67.376, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 171.584], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 612.688, 612.688, 268.08], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 179.975], 'output': {'model1': 0, 'model2': 0}}, {'input': [358.964, -76.971, -76.971, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [193.588, -12.817, -12.817, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 217.734], 'output': {'model1': 0, 'model2': 1}}, {'input': [51.838, -44.894, -44.894, -54.972], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [99.088, 35.299, 35.299, 255.494], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 188.366], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 99.453, 99.453, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 158.998], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 19.261, 19.261, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -12.817, -12.817, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 150.607], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 99.453, 99.453, -0.431], 'output': {'model1': 1, 'model2': 1}}, {'input': [-101.725, 19.261, 19.261, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 45.72], 'output': {'model1': 1, 'model2': 0}}, {'input': [-19.037, -60.932, -60.932, -75.95], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, -84.34], 'output': {'model1': 1, 'model2': 1}}, {'input': [16.4, -44.894, -44.894, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-7.225, 51.338, 51.338, 83.479], 'output': {'model1': 0, 'model2': 1}}, {'input': [75.463, 19.261, 19.261, 247.103], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-78.1, 3.222, 3.222, -54.972], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -28.855, -28.855, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -12.817, -12.817, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -96.927], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -60.932, -60.932, -105.318], 'output': {'model1': 1, 'model2': 1}}, {'input': [16.4, 3.222, 3.222, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, -17.213], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -60.932, -60.932, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -42.386], 'output': {'model1': 0, 'model2': 0}}, {'input': [40.026, -44.894, -44.894, -75.95], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 99.453, 99.453, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-54.475, 131.531, 131.531, 217.734], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 83.415, 83.415, -46.581], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [-78.1, -28.855, -28.855, -21.408], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 67.376, 67.376, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 83.415, 83.415, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [-113.537, 35.299, 35.299, 104.456], 'output': {'model1': 0, 'model2': 1}}, {'input': [16.4, 163.608, 163.608, 230.321], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -60.932, -60.932, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-30.85, 131.531, 131.531, 58.306], 'output': {'model1': 1, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 35.299, 35.299, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 147.569, 147.569, 179.975], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 51.338, 51.338, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, -8.822], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -101.122], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -28.855, -28.855, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 16.351], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -44.894, -44.894, -54.972], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 3.222, 3.222, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 268.08], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 230.321], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -50.777], 'output': {'model1': 1, 'model2': 1}}, {'input': [158.151, -44.894, -44.894, 58.306], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 200.952], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 35.299, 35.299, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 54.111], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, 3.222, 3.222, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 67.376, 67.376, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 24.742], 'output': {'model1': 1, 'model2': 1}}, {'input': [75.463, -44.894, -44.894, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [134.526, -76.971, -76.971, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 51.338, 51.338, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, 221.93], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 117.043], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -44.894, -44.894, -50.777], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 51.338, 51.338, -25.604], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 54.111], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, 19.261, 19.261, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, 19.261, 19.261, 158.998], 'output': {'model1': 0, 'model2': 0}}]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "ca213365-6813-46ab-b214-2c26b075a15c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "verb_data == verb_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "id": "7427ca6e-acbd-46f8-9506-00849ca4d2ec",
   "metadata": {},
   "outputs": [],
   "source": [
    "verb_data2 = [{'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 67.376, 67.376, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 171.584], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 612.688, 612.688, 268.08], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 179.975], 'output': {'model1': 0, 'model2': 0}}, {'input': [358.964, -76.971, -76.971, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [193.588, -12.817, -12.817, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 217.734], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -54.972], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, 3.222, 3.222, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [99.088, 35.299, 35.299, 255.494], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 188.366], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 99.453, 99.453, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 158.998], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, 19.261, 19.261, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -12.817, -12.817, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 150.607], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 99.453, 99.453, -0.431], 'output': {'model1': 1, 'model2': 1}}, {'input': [-101.725, 19.261, 19.261, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 45.72], 'output': {'model1': 0, 'model2': 1}}, {'input': [-19.037, -60.932, -60.932, -75.95], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, 19.261, 19.261, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, -84.34], 'output': {'model1': 1, 'model2': 1}}, {'input': [16.4, -44.894, -44.894, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-7.225, 51.338, 51.338, 83.479], 'output': {'model1': 0, 'model2': 1}}, {'input': [75.463, 19.261, 19.261, 247.103], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-78.1, 3.222, 3.222, -54.972], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -28.855, -28.855, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -12.817, -12.817, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -96.927], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -60.932, -60.932, -105.318], 'output': {'model1': 0, 'model2': 1}}, {'input': [16.4, 3.222, 3.222, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, -17.213], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -42.386], 'output': {'model1': 0, 'model2': 0}}, {'input': [40.026, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 99.453, 99.453, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-54.475, 131.531, 131.531, 217.734], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 83.415, 83.415, -46.581], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [-78.1, -28.855, -28.855, -21.408], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, 67.376, 67.376, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 83.415, 83.415, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [-113.537, 35.299, 35.299, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 163.608, 163.608, 230.321], 'output': {'model1': 0, 'model2': 1}}, {'input': [75.463, -60.932, -60.932, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-30.85, 131.531, 131.531, 58.306], 'output': {'model1': 1, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, 35.299, 35.299, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 147.569, 147.569, 179.975], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 51.338, 51.338, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 19.261, 19.261, -8.822], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, -101.122], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -28.855, -28.855, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 16.351], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -44.894, -44.894, -54.972], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, 3.222, 3.222, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 268.08], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 230.321], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -50.777], 'output': {'model1': 1, 'model2': 1}}, {'input': [158.151, -44.894, -44.894, 58.306], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 200.952], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 35.299, 35.299, 24.742], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -44.894, -44.894, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 54.111], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 3.222, 3.222, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 67.376, 67.376, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 24.742], 'output': {'model1': 1, 'model2': 1}}, {'input': [75.463, -44.894, -44.894, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [134.526, -76.971, -76.971, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 51.338, 51.338, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, 221.93], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 117.043], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -44.894, -44.894, -50.777], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 51.338, 51.338, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 54.111], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, 19.261, 19.261, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [51.838, 19.261, 19.261, 158.998], 'output': {'model1': 0, 'model2': 0}}]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "id": "851e14da-a79b-4e84-84d5-07203d9a9b96",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "verb_data2 == verb_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "id": "29585843-e1b5-4c56-8f72-1d075588c528",
   "metadata": {},
   "outputs": [],
   "source": [
    "verb_data3 = [{'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 67.376, 67.376, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 171.584], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 612.688, 612.688, 268.08], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 179.975], 'output': {'model1': 0, 'model2': 0}}, {'input': [358.964, -76.971, -76.971, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 0}}, {'input': [193.588, -12.817, -12.817, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 217.734], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -25.604], 'output': {'model1': 1, 'model2': 0}}, {'input': [99.088, 35.299, 35.299, 255.494], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 188.366], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 99.453, 99.453, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 158.998], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 19.261, 19.261, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -12.817, -12.817, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 150.607], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 99.453, 99.453, -0.431], 'output': {'model1': 1, 'model2': 1}}, {'input': [-101.725, 19.261, 19.261, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 45.72], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, -60.932, -60.932, -75.95], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, -84.34], 'output': {'model1': 1, 'model2': 1}}, {'input': [16.4, -44.894, -44.894, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 0}}, {'input': [-7.225, 51.338, 51.338, 83.479], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, 247.103], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-78.1, 3.222, 3.222, -54.972], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -28.855, -28.855, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -12.817, -12.817, -75.95], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -12.817, -12.817, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -96.927], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -60.932, -60.932, -105.318], 'output': {'model1': 1, 'model2': 0}}, {'input': [16.4, 3.222, 3.222, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, -17.213], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -42.386], 'output': {'model1': 0, 'model2': 0}}, {'input': [40.026, -44.894, -44.894, -75.95], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 99.453, 99.453, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-54.475, 131.531, 131.531, 217.734], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 83.415, 83.415, -46.581], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-78.1, -28.855, -28.855, -21.408], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, 67.376, 67.376, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 83.415, 83.415, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [-113.537, 35.299, 35.299, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 163.608, 163.608, 230.321], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -60.932, -60.932, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-30.85, 131.531, 131.531, 58.306], 'output': {'model1': 1, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 35.299, 35.299, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 147.569, 147.569, 179.975], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 51.338, 51.338, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, 19.261, 19.261, -8.822], 'output': {'model1': 1, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -101.122], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -28.855, -28.855, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 16.351], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -44.894, -44.894, -54.972], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 3.222, 3.222, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 268.08], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 230.321], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -50.777], 'output': {'model1': 1, 'model2': 1}}, {'input': [158.151, -44.894, -44.894, 58.306], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 200.952], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 35.299, 35.299, 24.742], 'output': {'model1': 1, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 54.111], 'output': {'model1': 0, 'model2': 1}}, {'input': [75.463, 3.222, 3.222, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 67.376, 67.376, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 24.742], 'output': {'model1': 1, 'model2': 1}}, {'input': [75.463, -44.894, -44.894, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [134.526, -76.971, -76.971, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 51.338, 51.338, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, 221.93], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 117.043], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -44.894, -44.894, -50.777], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 51.338, 51.338, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -28.855, -28.855, -84.34], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 54.111], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, 19.261, 19.261, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 0, 'model2': 1}}, {'input': [51.838, 19.261, 19.261, 158.998], 'output': {'model1': 0, 'model2': 0}}]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "id": "bb201778-2afa-4988-8889-8f74b370826d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "verb_data3 == verb_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "id": "39223733-e5f8-4010-b78f-3c606123015a",
   "metadata": {},
   "outputs": [],
   "source": [
    "verb_data4 = [{'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 67.376, 67.376, -25.604], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 171.584], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 612.688, 612.688, 268.08], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 179.975], 'output': {'model1': 0, 'model2': 0}}, {'input': [358.964, -76.971, -76.971, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [193.588, -12.817, -12.817, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 217.734], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -54.972], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -25.604], 'output': {'model1': 1, 'model2': 0}}, {'input': [99.088, 35.299, 35.299, 255.494], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 188.366], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 99.453, 99.453, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 24.742], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 158.998], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 19.261, 19.261, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -12.817, -12.817, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 150.607], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, -126.295], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 99.453, 99.453, -0.431], 'output': {'model1': 1, 'model2': 1}}, {'input': [-101.725, 19.261, 19.261, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, 45.72], 'output': {'model1': 1, 'model2': 1}}, {'input': [-19.037, -60.932, -60.932, -75.95], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, -84.34], 'output': {'model1': 1, 'model2': 1}}, {'input': [16.4, -44.894, -44.894, 175.78], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-7.225, 51.338, 51.338, 83.479], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, 247.103], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-78.1, 3.222, 3.222, -54.972], 'output': {'model1': 1, 'model2': 1}}, {'input': [134.526, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -28.855, -28.855, 75.088], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -44.894, -44.894, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -12.817, -12.817, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -96.927], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, -60.932, -60.932, -105.318], 'output': {'model1': 1, 'model2': 0}}, {'input': [16.4, 3.222, 3.222, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, -17.213], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -42.386], 'output': {'model1': 0, 'model2': 0}}, {'input': [40.026, -44.894, -44.894, -75.95], 'output': {'model1': 1, 'model2': 1}}, {'input': [-66.287, 99.453, 99.453, 226.125], 'output': {'model1': 0, 'model2': 0}}, {'input': [-54.475, 131.531, 131.531, 217.734], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 83.415, 83.415, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-78.1, -28.855, -28.855, -21.408], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, 67.376, 67.376, 62.501], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 83.415, 83.415, -25.604], 'output': {'model1': 1, 'model2': 0}}, {'input': [-113.537, 35.299, 35.299, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 163.608, 163.608, 230.321], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -60.932, -60.932, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-30.85, 131.531, 131.531, 58.306], 'output': {'model1': 1, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 35.299, 35.299, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 147.569, 147.569, 179.975], 'output': {'model1': 1, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, 96.065], 'output': {'model1': 0, 'model2': 0}}, {'input': [-19.037, 51.338, 51.338, 125.434], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, -8.822], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, -101.122], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -28.855, -28.855, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 16.351], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -60.932, -60.932, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 35.299, 35.299, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -44.894, -44.894, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -44.894, -44.894, -54.972], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, 3.222, 3.222, 150.607], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 100.261], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 268.08], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 230.321], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 3.222, 3.222, -50.777], 'output': {'model1': 1, 'model2': 1}}, {'input': [158.151, -44.894, -44.894, 58.306], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 19.261, 19.261, 200.952], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 35.299, 35.299, 24.742], 'output': {'model1': 0, 'model2': 1}}, {'input': [-89.912, -60.932, -60.932, -96.927], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, -76.971, -76.971, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, 99.453, 99.453, 54.111], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 3.222, 3.222, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -60.932, -60.932, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -12.817, -12.817, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 104.456], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 67.376, 67.376, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 131.531, 131.531, 24.742], 'output': {'model1': 1, 'model2': 1}}, {'input': [75.463, -44.894, -44.894, 66.697], 'output': {'model1': 0, 'model2': 0}}, {'input': [134.526, -76.971, -76.971, -54.972], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -75.95], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, -76.971, -76.971, -96.927], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -12.817, -12.817, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [16.4, 51.338, 51.338, -4.626], 'output': {'model1': 0, 'model2': 0}}, {'input': [75.463, 19.261, 19.261, 221.93], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -44.894, -44.894, 117.043], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -60.932, -60.932, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -44.894, -44.894, -50.777], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [-66.287, 51.338, 51.338, -25.604], 'output': {'model1': 0, 'model2': 1}}, {'input': [-66.287, -28.855, -28.855, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -60.932, -60.932, 28.938], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, 3.222, 3.222, 54.111], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -76.971, -76.971, -134.686], 'output': {'model1': 1, 'model2': 0}}, {'input': [158.151, -76.971, -76.971, -46.581], 'output': {'model1': 0, 'model2': 0}}, {'input': [-89.912, -28.855, -28.855, 3.765], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -28.855, -28.855, -25.604], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, -76.971, -76.971, -84.34], 'output': {'model1': 0, 'model2': 0}}, {'input': [51.838, 19.261, 19.261, -33.995], 'output': {'model1': 0, 'model2': 0}}, {'input': [-66.287, -76.971, -76.971, -126.295], 'output': {'model1': 1, 'model2': 0}}, {'input': [51.838, 19.261, 19.261, 158.998], 'output': {'model1': 0, 'model2': 0}}]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "id": "51e52657-1843-423e-8dbe-838b73092b21",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "verb_data4 == verb_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2271873b-e486-4bef-a93c-cff2b35f0fbc",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "72b68c4c-a260-4061-b955-f481176792a4",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ead40791-4fef-42d9-b745-656e63cceb61",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
