{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "7ea9fe69",
   "metadata": {
    "column": 1,
    "index": 1
   },
   "source": [
    "# Section 1: Imports & Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "67d8f204",
   "metadata": {
    "column": 1,
    "index": 2
   },
   "outputs": [],
   "source": [
    "# Library Import Statements\n",
    "\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "from sklearn.preprocessing import normalize\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "eeea4b01",
   "metadata": {
    "column": 1,
    "index": 3
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2.959060</td>\n",
       "      <td>3.079885</td>\n",
       "      <td>8.381025</td>\n",
       "      <td>9.780754</td>\n",
       "      <td>3.763085</td>\n",
       "      <td>-0.782604</td>\n",
       "      <td>-1.257395</td>\n",
       "      <td>-1.723086</td>\n",
       "      <td>0.650456</td>\n",
       "      <td>0.859578</td>\n",
       "      <td>0.887445</td>\n",
       "      <td>0.958034</td>\n",
       "      <td>0.055347</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>9.304097</td>\n",
       "      <td>4.902524</td>\n",
       "      <td>3.047541</td>\n",
       "      <td>1.369357</td>\n",
       "      <td>5.067812</td>\n",
       "      <td>-1.940058</td>\n",
       "      <td>-1.872742</td>\n",
       "      <td>-1.255012</td>\n",
       "      <td>0.413441</td>\n",
       "      <td>0.862414</td>\n",
       "      <td>0.562139</td>\n",
       "      <td>0.781760</td>\n",
       "      <td>-0.005957</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8.971707</td>\n",
       "      <td>8.848428</td>\n",
       "      <td>3.046479</td>\n",
       "      <td>1.214518</td>\n",
       "      <td>3.405158</td>\n",
       "      <td>-1.207456</td>\n",
       "      <td>-1.277210</td>\n",
       "      <td>-0.920492</td>\n",
       "      <td>0.163041</td>\n",
       "      <td>0.766689</td>\n",
       "      <td>0.839444</td>\n",
       "      <td>0.109853</td>\n",
       "      <td>0.003471</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.716415</td>\n",
       "      <td>7.669600</td>\n",
       "      <td>4.486641</td>\n",
       "      <td>2.340563</td>\n",
       "      <td>3.963791</td>\n",
       "      <td>-1.027473</td>\n",
       "      <td>-1.938944</td>\n",
       "      <td>-0.997374</td>\n",
       "      <td>0.446209</td>\n",
       "      <td>0.976744</td>\n",
       "      <td>0.929381</td>\n",
       "      <td>0.362718</td>\n",
       "      <td>0.028871</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3.134112</td>\n",
       "      <td>7.608772</td>\n",
       "      <td>4.943759</td>\n",
       "      <td>9.857573</td>\n",
       "      <td>3.525811</td>\n",
       "      <td>-1.125531</td>\n",
       "      <td>-1.845975</td>\n",
       "      <td>-0.554305</td>\n",
       "      <td>0.797110</td>\n",
       "      <td>0.455450</td>\n",
       "      <td>0.656947</td>\n",
       "      <td>0.820923</td>\n",
       "      <td>0.049860</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "0  2.959060  3.079885  8.381025  9.780754  3.763085 -0.782604 -1.257395   \n",
       "1  9.304097  4.902524  3.047541  1.369357  5.067812 -1.940058 -1.872742   \n",
       "2  8.971707  8.848428  3.046479  1.214518  3.405158 -1.207456 -1.277210   \n",
       "3  0.716415  7.669600  4.486641  2.340563  3.963791 -1.027473 -1.938944   \n",
       "4  3.134112  7.608772  4.943759  9.857573  3.525811 -1.125531 -1.845975   \n",
       "\n",
       "         p4        g1        g2        g3        g4      stab     stabf  \n",
       "0 -1.723086  0.650456  0.859578  0.887445  0.958034  0.055347  unstable  \n",
       "1 -1.255012  0.413441  0.862414  0.562139  0.781760 -0.005957    stable  \n",
       "2 -0.920492  0.163041  0.766689  0.839444  0.109853  0.003471  unstable  \n",
       "3 -0.997374  0.446209  0.976744  0.929381  0.362718  0.028871  unstable  \n",
       "4 -0.554305  0.797110  0.455450  0.656947  0.820923  0.049860  unstable  "
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Data Import Cell\n",
    "url = \"http://archive.ics.uci.edu/ml/machine-learning-databases/00471/Data_for_UCI_named.csv\"\n",
    "data = pd.read_csv(url, sep=\",\")\n",
    "data.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "9ef2b0af",
   "metadata": {
    "column": 2,
    "index": 4
   },
   "source": [
    "# Section 2: 1st Analysis"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "50a4c8ba",
   "metadata": {
    "column": 2,
    "index": 5
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2.959060</td>\n",
       "      <td>3.079885</td>\n",
       "      <td>8.381025</td>\n",
       "      <td>9.780754</td>\n",
       "      <td>3.763085</td>\n",
       "      <td>-0.782604</td>\n",
       "      <td>-1.257395</td>\n",
       "      <td>-1.723086</td>\n",
       "      <td>0.650456</td>\n",
       "      <td>0.859578</td>\n",
       "      <td>0.887445</td>\n",
       "      <td>0.958034</td>\n",
       "      <td>0.055347</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>9.304097</td>\n",
       "      <td>4.902524</td>\n",
       "      <td>3.047541</td>\n",
       "      <td>1.369357</td>\n",
       "      <td>5.067812</td>\n",
       "      <td>-1.940058</td>\n",
       "      <td>-1.872742</td>\n",
       "      <td>-1.255012</td>\n",
       "      <td>0.413441</td>\n",
       "      <td>0.862414</td>\n",
       "      <td>0.562139</td>\n",
       "      <td>0.781760</td>\n",
       "      <td>-0.005957</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8.971707</td>\n",
       "      <td>8.848428</td>\n",
       "      <td>3.046479</td>\n",
       "      <td>1.214518</td>\n",
       "      <td>3.405158</td>\n",
       "      <td>-1.207456</td>\n",
       "      <td>-1.277210</td>\n",
       "      <td>-0.920492</td>\n",
       "      <td>0.163041</td>\n",
       "      <td>0.766689</td>\n",
       "      <td>0.839444</td>\n",
       "      <td>0.109853</td>\n",
       "      <td>0.003471</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.716415</td>\n",
       "      <td>7.669600</td>\n",
       "      <td>4.486641</td>\n",
       "      <td>2.340563</td>\n",
       "      <td>3.963791</td>\n",
       "      <td>-1.027473</td>\n",
       "      <td>-1.938944</td>\n",
       "      <td>-0.997374</td>\n",
       "      <td>0.446209</td>\n",
       "      <td>0.976744</td>\n",
       "      <td>0.929381</td>\n",
       "      <td>0.362718</td>\n",
       "      <td>0.028871</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3.134112</td>\n",
       "      <td>7.608772</td>\n",
       "      <td>4.943759</td>\n",
       "      <td>9.857573</td>\n",
       "      <td>3.525811</td>\n",
       "      <td>-1.125531</td>\n",
       "      <td>-1.845975</td>\n",
       "      <td>-0.554305</td>\n",
       "      <td>0.797110</td>\n",
       "      <td>0.455450</td>\n",
       "      <td>0.656947</td>\n",
       "      <td>0.820923</td>\n",
       "      <td>0.049860</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>3.592940</td>\n",
       "      <td>8.130493</td>\n",
       "      <td>3.270724</td>\n",
       "      <td>8.075292</td>\n",
       "      <td>4.772430</td>\n",
       "      <td>-1.458529</td>\n",
       "      <td>-1.690274</td>\n",
       "      <td>-1.623627</td>\n",
       "      <td>0.210123</td>\n",
       "      <td>0.683625</td>\n",
       "      <td>0.159779</td>\n",
       "      <td>0.344948</td>\n",
       "      <td>0.011499</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>7.656651</td>\n",
       "      <td>6.411748</td>\n",
       "      <td>5.655960</td>\n",
       "      <td>6.045712</td>\n",
       "      <td>3.193900</td>\n",
       "      <td>-0.918944</td>\n",
       "      <td>-1.377013</td>\n",
       "      <td>-0.897943</td>\n",
       "      <td>0.443617</td>\n",
       "      <td>0.490799</td>\n",
       "      <td>0.988511</td>\n",
       "      <td>0.788984</td>\n",
       "      <td>0.086436</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>1.069438</td>\n",
       "      <td>6.581439</td>\n",
       "      <td>1.230892</td>\n",
       "      <td>9.937483</td>\n",
       "      <td>3.756828</td>\n",
       "      <td>-1.524720</td>\n",
       "      <td>-0.516322</td>\n",
       "      <td>-1.715786</td>\n",
       "      <td>0.501101</td>\n",
       "      <td>0.381437</td>\n",
       "      <td>0.773236</td>\n",
       "      <td>0.822149</td>\n",
       "      <td>-0.025390</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>4.629745</td>\n",
       "      <td>8.353612</td>\n",
       "      <td>8.119304</td>\n",
       "      <td>8.600847</td>\n",
       "      <td>2.960941</td>\n",
       "      <td>-1.424327</td>\n",
       "      <td>-0.890685</td>\n",
       "      <td>-0.645929</td>\n",
       "      <td>0.383265</td>\n",
       "      <td>0.241701</td>\n",
       "      <td>0.609101</td>\n",
       "      <td>0.756135</td>\n",
       "      <td>0.052382</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>0.754512</td>\n",
       "      <td>9.723392</td>\n",
       "      <td>9.264871</td>\n",
       "      <td>1.415836</td>\n",
       "      <td>5.029876</td>\n",
       "      <td>-1.281568</td>\n",
       "      <td>-1.946921</td>\n",
       "      <td>-1.801387</td>\n",
       "      <td>0.448670</td>\n",
       "      <td>0.413843</td>\n",
       "      <td>0.273108</td>\n",
       "      <td>0.251181</td>\n",
       "      <td>-0.036986</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "0     2.959060  3.079885  8.381025  9.780754  3.763085 -0.782604 -1.257395   \n",
       "1     9.304097  4.902524  3.047541  1.369357  5.067812 -1.940058 -1.872742   \n",
       "2     8.971707  8.848428  3.046479  1.214518  3.405158 -1.207456 -1.277210   \n",
       "3     0.716415  7.669600  4.486641  2.340563  3.963791 -1.027473 -1.938944   \n",
       "4     3.134112  7.608772  4.943759  9.857573  3.525811 -1.125531 -1.845975   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "4995  3.592940  8.130493  3.270724  8.075292  4.772430 -1.458529 -1.690274   \n",
       "4996  7.656651  6.411748  5.655960  6.045712  3.193900 -0.918944 -1.377013   \n",
       "4997  1.069438  6.581439  1.230892  9.937483  3.756828 -1.524720 -0.516322   \n",
       "4998  4.629745  8.353612  8.119304  8.600847  2.960941 -1.424327 -0.890685   \n",
       "4999  0.754512  9.723392  9.264871  1.415836  5.029876 -1.281568 -1.946921   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab     stabf  \n",
       "0    -1.723086  0.650456  0.859578  0.887445  0.958034  0.055347  unstable  \n",
       "1    -1.255012  0.413441  0.862414  0.562139  0.781760 -0.005957    stable  \n",
       "2    -0.920492  0.163041  0.766689  0.839444  0.109853  0.003471  unstable  \n",
       "3    -0.997374  0.446209  0.976744  0.929381  0.362718  0.028871  unstable  \n",
       "4    -0.554305  0.797110  0.455450  0.656947  0.820923  0.049860  unstable  \n",
       "...        ...       ...       ...       ...       ...       ...       ...  \n",
       "4995 -1.623627  0.210123  0.683625  0.159779  0.344948  0.011499  unstable  \n",
       "4996 -0.897943  0.443617  0.490799  0.988511  0.788984  0.086436  unstable  \n",
       "4997 -1.715786  0.501101  0.381437  0.773236  0.822149 -0.025390    stable  \n",
       "4998 -0.645929  0.383265  0.241701  0.609101  0.756135  0.052382  unstable  \n",
       "4999 -1.801387  0.448670  0.413843  0.273108  0.251181 -0.036986    stable  \n",
       "\n",
       "[5000 rows x 14 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "my_data = data.head(5000)\n",
    "my_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "f8ffd9ad",
   "metadata": {
    "column": 3,
    "index": 6
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\harde\\AppData\\Local\\Programs\\Python\\Python39\\lib\\site-packages\\pandas\\core\\indexing.py:1817: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\n",
      "\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
      "  self._setitem_single_column(loc, value, pi)\n",
      "C:\\Users\\harde\\AppData\\Local\\Temp\\ipykernel_21872\\9913949.py:8: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\n",
      "\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
      "  my_data['stabf'] = pd.to_numeric(my_data['stabf'])\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2.959060</td>\n",
       "      <td>3.079885</td>\n",
       "      <td>8.381025</td>\n",
       "      <td>9.780754</td>\n",
       "      <td>3.763085</td>\n",
       "      <td>-0.782604</td>\n",
       "      <td>-1.257395</td>\n",
       "      <td>-1.723086</td>\n",
       "      <td>0.650456</td>\n",
       "      <td>0.859578</td>\n",
       "      <td>0.887445</td>\n",
       "      <td>0.958034</td>\n",
       "      <td>0.055347</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>9.304097</td>\n",
       "      <td>4.902524</td>\n",
       "      <td>3.047541</td>\n",
       "      <td>1.369357</td>\n",
       "      <td>5.067812</td>\n",
       "      <td>-1.940058</td>\n",
       "      <td>-1.872742</td>\n",
       "      <td>-1.255012</td>\n",
       "      <td>0.413441</td>\n",
       "      <td>0.862414</td>\n",
       "      <td>0.562139</td>\n",
       "      <td>0.781760</td>\n",
       "      <td>-0.005957</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8.971707</td>\n",
       "      <td>8.848428</td>\n",
       "      <td>3.046479</td>\n",
       "      <td>1.214518</td>\n",
       "      <td>3.405158</td>\n",
       "      <td>-1.207456</td>\n",
       "      <td>-1.277210</td>\n",
       "      <td>-0.920492</td>\n",
       "      <td>0.163041</td>\n",
       "      <td>0.766689</td>\n",
       "      <td>0.839444</td>\n",
       "      <td>0.109853</td>\n",
       "      <td>0.003471</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.716415</td>\n",
       "      <td>7.669600</td>\n",
       "      <td>4.486641</td>\n",
       "      <td>2.340563</td>\n",
       "      <td>3.963791</td>\n",
       "      <td>-1.027473</td>\n",
       "      <td>-1.938944</td>\n",
       "      <td>-0.997374</td>\n",
       "      <td>0.446209</td>\n",
       "      <td>0.976744</td>\n",
       "      <td>0.929381</td>\n",
       "      <td>0.362718</td>\n",
       "      <td>0.028871</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3.134112</td>\n",
       "      <td>7.608772</td>\n",
       "      <td>4.943759</td>\n",
       "      <td>9.857573</td>\n",
       "      <td>3.525811</td>\n",
       "      <td>-1.125531</td>\n",
       "      <td>-1.845975</td>\n",
       "      <td>-0.554305</td>\n",
       "      <td>0.797110</td>\n",
       "      <td>0.455450</td>\n",
       "      <td>0.656947</td>\n",
       "      <td>0.820923</td>\n",
       "      <td>0.049860</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>3.592940</td>\n",
       "      <td>8.130493</td>\n",
       "      <td>3.270724</td>\n",
       "      <td>8.075292</td>\n",
       "      <td>4.772430</td>\n",
       "      <td>-1.458529</td>\n",
       "      <td>-1.690274</td>\n",
       "      <td>-1.623627</td>\n",
       "      <td>0.210123</td>\n",
       "      <td>0.683625</td>\n",
       "      <td>0.159779</td>\n",
       "      <td>0.344948</td>\n",
       "      <td>0.011499</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>7.656651</td>\n",
       "      <td>6.411748</td>\n",
       "      <td>5.655960</td>\n",
       "      <td>6.045712</td>\n",
       "      <td>3.193900</td>\n",
       "      <td>-0.918944</td>\n",
       "      <td>-1.377013</td>\n",
       "      <td>-0.897943</td>\n",
       "      <td>0.443617</td>\n",
       "      <td>0.490799</td>\n",
       "      <td>0.988511</td>\n",
       "      <td>0.788984</td>\n",
       "      <td>0.086436</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>1.069438</td>\n",
       "      <td>6.581439</td>\n",
       "      <td>1.230892</td>\n",
       "      <td>9.937483</td>\n",
       "      <td>3.756828</td>\n",
       "      <td>-1.524720</td>\n",
       "      <td>-0.516322</td>\n",
       "      <td>-1.715786</td>\n",
       "      <td>0.501101</td>\n",
       "      <td>0.381437</td>\n",
       "      <td>0.773236</td>\n",
       "      <td>0.822149</td>\n",
       "      <td>-0.025390</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>4.629745</td>\n",
       "      <td>8.353612</td>\n",
       "      <td>8.119304</td>\n",
       "      <td>8.600847</td>\n",
       "      <td>2.960941</td>\n",
       "      <td>-1.424327</td>\n",
       "      <td>-0.890685</td>\n",
       "      <td>-0.645929</td>\n",
       "      <td>0.383265</td>\n",
       "      <td>0.241701</td>\n",
       "      <td>0.609101</td>\n",
       "      <td>0.756135</td>\n",
       "      <td>0.052382</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>0.754512</td>\n",
       "      <td>9.723392</td>\n",
       "      <td>9.264871</td>\n",
       "      <td>1.415836</td>\n",
       "      <td>5.029876</td>\n",
       "      <td>-1.281568</td>\n",
       "      <td>-1.946921</td>\n",
       "      <td>-1.801387</td>\n",
       "      <td>0.448670</td>\n",
       "      <td>0.413843</td>\n",
       "      <td>0.273108</td>\n",
       "      <td>0.251181</td>\n",
       "      <td>-0.036986</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "0     2.959060  3.079885  8.381025  9.780754  3.763085 -0.782604 -1.257395   \n",
       "1     9.304097  4.902524  3.047541  1.369357  5.067812 -1.940058 -1.872742   \n",
       "2     8.971707  8.848428  3.046479  1.214518  3.405158 -1.207456 -1.277210   \n",
       "3     0.716415  7.669600  4.486641  2.340563  3.963791 -1.027473 -1.938944   \n",
       "4     3.134112  7.608772  4.943759  9.857573  3.525811 -1.125531 -1.845975   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "4995  3.592940  8.130493  3.270724  8.075292  4.772430 -1.458529 -1.690274   \n",
       "4996  7.656651  6.411748  5.655960  6.045712  3.193900 -0.918944 -1.377013   \n",
       "4997  1.069438  6.581439  1.230892  9.937483  3.756828 -1.524720 -0.516322   \n",
       "4998  4.629745  8.353612  8.119304  8.600847  2.960941 -1.424327 -0.890685   \n",
       "4999  0.754512  9.723392  9.264871  1.415836  5.029876 -1.281568 -1.946921   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab  stabf  \n",
       "0    -1.723086  0.650456  0.859578  0.887445  0.958034  0.055347      1  \n",
       "1    -1.255012  0.413441  0.862414  0.562139  0.781760 -0.005957      0  \n",
       "2    -0.920492  0.163041  0.766689  0.839444  0.109853  0.003471      1  \n",
       "3    -0.997374  0.446209  0.976744  0.929381  0.362718  0.028871      1  \n",
       "4    -0.554305  0.797110  0.455450  0.656947  0.820923  0.049860      1  \n",
       "...        ...       ...       ...       ...       ...       ...    ...  \n",
       "4995 -1.623627  0.210123  0.683625  0.159779  0.344948  0.011499      1  \n",
       "4996 -0.897943  0.443617  0.490799  0.988511  0.788984  0.086436      1  \n",
       "4997 -1.715786  0.501101  0.381437  0.773236  0.822149 -0.025390      0  \n",
       "4998 -0.645929  0.383265  0.241701  0.609101  0.756135  0.052382      1  \n",
       "4999 -1.801387  0.448670  0.413843  0.273108  0.251181 -0.036986      0  \n",
       "\n",
       "[5000 rows x 14 columns]"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Convert Class names to numbers\n",
    "# 0 = stable\n",
    "# 1 = unstable\n",
    "\n",
    "# assign values to the dependent variable\n",
    "my_data.loc[(my_data['stabf'] == 'stable'), 'stabf'] = 0\n",
    "my_data.loc[(my_data['stabf'] == 'unstable'), 'stabf'] = 1\n",
    "my_data['stabf'] = pd.to_numeric(my_data['stabf'])\n",
    "my_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "6ecdac84",
   "metadata": {
    "column": 3,
    "index": 7,
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3500</th>\n",
       "      <td>7.592223</td>\n",
       "      <td>1.389509</td>\n",
       "      <td>7.285896</td>\n",
       "      <td>6.031028</td>\n",
       "      <td>4.901480</td>\n",
       "      <td>-1.809328</td>\n",
       "      <td>-1.536639</td>\n",
       "      <td>-1.555512</td>\n",
       "      <td>0.444016</td>\n",
       "      <td>0.469558</td>\n",
       "      <td>0.559769</td>\n",
       "      <td>0.170529</td>\n",
       "      <td>0.001593</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3501</th>\n",
       "      <td>9.203739</td>\n",
       "      <td>3.031134</td>\n",
       "      <td>2.742088</td>\n",
       "      <td>7.318112</td>\n",
       "      <td>4.379546</td>\n",
       "      <td>-1.160296</td>\n",
       "      <td>-1.374819</td>\n",
       "      <td>-1.844431</td>\n",
       "      <td>0.322139</td>\n",
       "      <td>0.945597</td>\n",
       "      <td>0.786776</td>\n",
       "      <td>0.527852</td>\n",
       "      <td>0.015995</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3502</th>\n",
       "      <td>4.016004</td>\n",
       "      <td>8.501127</td>\n",
       "      <td>5.345373</td>\n",
       "      <td>6.943443</td>\n",
       "      <td>2.952986</td>\n",
       "      <td>-0.535994</td>\n",
       "      <td>-1.375817</td>\n",
       "      <td>-1.041175</td>\n",
       "      <td>0.662382</td>\n",
       "      <td>0.300356</td>\n",
       "      <td>0.251775</td>\n",
       "      <td>0.559976</td>\n",
       "      <td>0.027832</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3503</th>\n",
       "      <td>1.568860</td>\n",
       "      <td>2.338635</td>\n",
       "      <td>7.562933</td>\n",
       "      <td>0.931341</td>\n",
       "      <td>3.180046</td>\n",
       "      <td>-1.887828</td>\n",
       "      <td>-0.673774</td>\n",
       "      <td>-0.618444</td>\n",
       "      <td>0.321079</td>\n",
       "      <td>0.081876</td>\n",
       "      <td>0.298656</td>\n",
       "      <td>0.078052</td>\n",
       "      <td>-0.051548</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3504</th>\n",
       "      <td>8.906023</td>\n",
       "      <td>4.356134</td>\n",
       "      <td>4.086695</td>\n",
       "      <td>1.396348</td>\n",
       "      <td>4.998403</td>\n",
       "      <td>-1.232689</td>\n",
       "      <td>-1.910843</td>\n",
       "      <td>-1.854870</td>\n",
       "      <td>0.143437</td>\n",
       "      <td>0.556369</td>\n",
       "      <td>0.929642</td>\n",
       "      <td>0.686855</td>\n",
       "      <td>0.007881</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>3.592940</td>\n",
       "      <td>8.130493</td>\n",
       "      <td>3.270724</td>\n",
       "      <td>8.075292</td>\n",
       "      <td>4.772430</td>\n",
       "      <td>-1.458529</td>\n",
       "      <td>-1.690274</td>\n",
       "      <td>-1.623627</td>\n",
       "      <td>0.210123</td>\n",
       "      <td>0.683625</td>\n",
       "      <td>0.159779</td>\n",
       "      <td>0.344948</td>\n",
       "      <td>0.011499</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>7.656651</td>\n",
       "      <td>6.411748</td>\n",
       "      <td>5.655960</td>\n",
       "      <td>6.045712</td>\n",
       "      <td>3.193900</td>\n",
       "      <td>-0.918944</td>\n",
       "      <td>-1.377013</td>\n",
       "      <td>-0.897943</td>\n",
       "      <td>0.443617</td>\n",
       "      <td>0.490799</td>\n",
       "      <td>0.988511</td>\n",
       "      <td>0.788984</td>\n",
       "      <td>0.086436</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>1.069438</td>\n",
       "      <td>6.581439</td>\n",
       "      <td>1.230892</td>\n",
       "      <td>9.937483</td>\n",
       "      <td>3.756828</td>\n",
       "      <td>-1.524720</td>\n",
       "      <td>-0.516322</td>\n",
       "      <td>-1.715786</td>\n",
       "      <td>0.501101</td>\n",
       "      <td>0.381437</td>\n",
       "      <td>0.773236</td>\n",
       "      <td>0.822149</td>\n",
       "      <td>-0.025390</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>4.629745</td>\n",
       "      <td>8.353612</td>\n",
       "      <td>8.119304</td>\n",
       "      <td>8.600847</td>\n",
       "      <td>2.960941</td>\n",
       "      <td>-1.424327</td>\n",
       "      <td>-0.890685</td>\n",
       "      <td>-0.645929</td>\n",
       "      <td>0.383265</td>\n",
       "      <td>0.241701</td>\n",
       "      <td>0.609101</td>\n",
       "      <td>0.756135</td>\n",
       "      <td>0.052382</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>0.754512</td>\n",
       "      <td>9.723392</td>\n",
       "      <td>9.264871</td>\n",
       "      <td>1.415836</td>\n",
       "      <td>5.029876</td>\n",
       "      <td>-1.281568</td>\n",
       "      <td>-1.946921</td>\n",
       "      <td>-1.801387</td>\n",
       "      <td>0.448670</td>\n",
       "      <td>0.413843</td>\n",
       "      <td>0.273108</td>\n",
       "      <td>0.251181</td>\n",
       "      <td>-0.036986</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1500 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "3500  7.592223  1.389509  7.285896  6.031028  4.901480 -1.809328 -1.536639   \n",
       "3501  9.203739  3.031134  2.742088  7.318112  4.379546 -1.160296 -1.374819   \n",
       "3502  4.016004  8.501127  5.345373  6.943443  2.952986 -0.535994 -1.375817   \n",
       "3503  1.568860  2.338635  7.562933  0.931341  3.180046 -1.887828 -0.673774   \n",
       "3504  8.906023  4.356134  4.086695  1.396348  4.998403 -1.232689 -1.910843   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "4995  3.592940  8.130493  3.270724  8.075292  4.772430 -1.458529 -1.690274   \n",
       "4996  7.656651  6.411748  5.655960  6.045712  3.193900 -0.918944 -1.377013   \n",
       "4997  1.069438  6.581439  1.230892  9.937483  3.756828 -1.524720 -0.516322   \n",
       "4998  4.629745  8.353612  8.119304  8.600847  2.960941 -1.424327 -0.890685   \n",
       "4999  0.754512  9.723392  9.264871  1.415836  5.029876 -1.281568 -1.946921   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab  stabf  \n",
       "3500 -1.555512  0.444016  0.469558  0.559769  0.170529  0.001593      1  \n",
       "3501 -1.844431  0.322139  0.945597  0.786776  0.527852  0.015995      1  \n",
       "3502 -1.041175  0.662382  0.300356  0.251775  0.559976  0.027832      1  \n",
       "3503 -0.618444  0.321079  0.081876  0.298656  0.078052 -0.051548      0  \n",
       "3504 -1.854870  0.143437  0.556369  0.929642  0.686855  0.007881      1  \n",
       "...        ...       ...       ...       ...       ...       ...    ...  \n",
       "4995 -1.623627  0.210123  0.683625  0.159779  0.344948  0.011499      1  \n",
       "4996 -0.897943  0.443617  0.490799  0.988511  0.788984  0.086436      1  \n",
       "4997 -1.715786  0.501101  0.381437  0.773236  0.822149 -0.025390      0  \n",
       "4998 -0.645929  0.383265  0.241701  0.609101  0.756135  0.052382      1  \n",
       "4999 -1.801387  0.448670  0.413843  0.273108  0.251181 -0.036986      0  \n",
       "\n",
       "[1500 rows x 14 columns]"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Split dataframe into testing and training sets\n",
    "train_data = my_data.iloc[:3500]\n",
    "test_data = my_data.iloc[3500:]\n",
    "test_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "6ea588de",
   "metadata": {
    "column": 3,
    "index": 8,
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3500</th>\n",
       "      <td>7.592223</td>\n",
       "      <td>1.389509</td>\n",
       "      <td>7.285896</td>\n",
       "      <td>6.031028</td>\n",
       "      <td>4.901480</td>\n",
       "      <td>-1.809328</td>\n",
       "      <td>-1.536639</td>\n",
       "      <td>-1.555512</td>\n",
       "      <td>0.444016</td>\n",
       "      <td>0.469558</td>\n",
       "      <td>0.559769</td>\n",
       "      <td>0.170529</td>\n",
       "      <td>0.001593</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3501</th>\n",
       "      <td>9.203739</td>\n",
       "      <td>3.031134</td>\n",
       "      <td>2.742088</td>\n",
       "      <td>7.318112</td>\n",
       "      <td>4.379546</td>\n",
       "      <td>-1.160296</td>\n",
       "      <td>-1.374819</td>\n",
       "      <td>-1.844431</td>\n",
       "      <td>0.322139</td>\n",
       "      <td>0.945597</td>\n",
       "      <td>0.786776</td>\n",
       "      <td>0.527852</td>\n",
       "      <td>0.015995</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3502</th>\n",
       "      <td>4.016004</td>\n",
       "      <td>8.501127</td>\n",
       "      <td>5.345373</td>\n",
       "      <td>6.943443</td>\n",
       "      <td>2.952986</td>\n",
       "      <td>-0.535994</td>\n",
       "      <td>-1.375817</td>\n",
       "      <td>-1.041175</td>\n",
       "      <td>0.662382</td>\n",
       "      <td>0.300356</td>\n",
       "      <td>0.251775</td>\n",
       "      <td>0.559976</td>\n",
       "      <td>0.027832</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3503</th>\n",
       "      <td>1.568860</td>\n",
       "      <td>2.338635</td>\n",
       "      <td>7.562933</td>\n",
       "      <td>0.931341</td>\n",
       "      <td>3.180046</td>\n",
       "      <td>-1.887828</td>\n",
       "      <td>-0.673774</td>\n",
       "      <td>-0.618444</td>\n",
       "      <td>0.321079</td>\n",
       "      <td>0.081876</td>\n",
       "      <td>0.298656</td>\n",
       "      <td>0.078052</td>\n",
       "      <td>-0.051548</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3504</th>\n",
       "      <td>8.906023</td>\n",
       "      <td>4.356134</td>\n",
       "      <td>4.086695</td>\n",
       "      <td>1.396348</td>\n",
       "      <td>4.998403</td>\n",
       "      <td>-1.232689</td>\n",
       "      <td>-1.910843</td>\n",
       "      <td>-1.854870</td>\n",
       "      <td>0.143437</td>\n",
       "      <td>0.556369</td>\n",
       "      <td>0.929642</td>\n",
       "      <td>0.686855</td>\n",
       "      <td>0.007881</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>3.592940</td>\n",
       "      <td>8.130493</td>\n",
       "      <td>3.270724</td>\n",
       "      <td>8.075292</td>\n",
       "      <td>4.772430</td>\n",
       "      <td>-1.458529</td>\n",
       "      <td>-1.690274</td>\n",
       "      <td>-1.623627</td>\n",
       "      <td>0.210123</td>\n",
       "      <td>0.683625</td>\n",
       "      <td>0.159779</td>\n",
       "      <td>0.344948</td>\n",
       "      <td>0.011499</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>7.656651</td>\n",
       "      <td>6.411748</td>\n",
       "      <td>5.655960</td>\n",
       "      <td>6.045712</td>\n",
       "      <td>3.193900</td>\n",
       "      <td>-0.918944</td>\n",
       "      <td>-1.377013</td>\n",
       "      <td>-0.897943</td>\n",
       "      <td>0.443617</td>\n",
       "      <td>0.490799</td>\n",
       "      <td>0.988511</td>\n",
       "      <td>0.788984</td>\n",
       "      <td>0.086436</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>1.069438</td>\n",
       "      <td>6.581439</td>\n",
       "      <td>1.230892</td>\n",
       "      <td>9.937483</td>\n",
       "      <td>3.756828</td>\n",
       "      <td>-1.524720</td>\n",
       "      <td>-0.516322</td>\n",
       "      <td>-1.715786</td>\n",
       "      <td>0.501101</td>\n",
       "      <td>0.381437</td>\n",
       "      <td>0.773236</td>\n",
       "      <td>0.822149</td>\n",
       "      <td>-0.025390</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>4.629745</td>\n",
       "      <td>8.353612</td>\n",
       "      <td>8.119304</td>\n",
       "      <td>8.600847</td>\n",
       "      <td>2.960941</td>\n",
       "      <td>-1.424327</td>\n",
       "      <td>-0.890685</td>\n",
       "      <td>-0.645929</td>\n",
       "      <td>0.383265</td>\n",
       "      <td>0.241701</td>\n",
       "      <td>0.609101</td>\n",
       "      <td>0.756135</td>\n",
       "      <td>0.052382</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>0.754512</td>\n",
       "      <td>9.723392</td>\n",
       "      <td>9.264871</td>\n",
       "      <td>1.415836</td>\n",
       "      <td>5.029876</td>\n",
       "      <td>-1.281568</td>\n",
       "      <td>-1.946921</td>\n",
       "      <td>-1.801387</td>\n",
       "      <td>0.448670</td>\n",
       "      <td>0.413843</td>\n",
       "      <td>0.273108</td>\n",
       "      <td>0.251181</td>\n",
       "      <td>-0.036986</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1500 rows × 13 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "3500  7.592223  1.389509  7.285896  6.031028  4.901480 -1.809328 -1.536639   \n",
       "3501  9.203739  3.031134  2.742088  7.318112  4.379546 -1.160296 -1.374819   \n",
       "3502  4.016004  8.501127  5.345373  6.943443  2.952986 -0.535994 -1.375817   \n",
       "3503  1.568860  2.338635  7.562933  0.931341  3.180046 -1.887828 -0.673774   \n",
       "3504  8.906023  4.356134  4.086695  1.396348  4.998403 -1.232689 -1.910843   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "4995  3.592940  8.130493  3.270724  8.075292  4.772430 -1.458529 -1.690274   \n",
       "4996  7.656651  6.411748  5.655960  6.045712  3.193900 -0.918944 -1.377013   \n",
       "4997  1.069438  6.581439  1.230892  9.937483  3.756828 -1.524720 -0.516322   \n",
       "4998  4.629745  8.353612  8.119304  8.600847  2.960941 -1.424327 -0.890685   \n",
       "4999  0.754512  9.723392  9.264871  1.415836  5.029876 -1.281568 -1.946921   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab  \n",
       "3500 -1.555512  0.444016  0.469558  0.559769  0.170529  0.001593  \n",
       "3501 -1.844431  0.322139  0.945597  0.786776  0.527852  0.015995  \n",
       "3502 -1.041175  0.662382  0.300356  0.251775  0.559976  0.027832  \n",
       "3503 -0.618444  0.321079  0.081876  0.298656  0.078052 -0.051548  \n",
       "3504 -1.854870  0.143437  0.556369  0.929642  0.686855  0.007881  \n",
       "...        ...       ...       ...       ...       ...       ...  \n",
       "4995 -1.623627  0.210123  0.683625  0.159779  0.344948  0.011499  \n",
       "4996 -0.897943  0.443617  0.490799  0.988511  0.788984  0.086436  \n",
       "4997 -1.715786  0.501101  0.381437  0.773236  0.822149 -0.025390  \n",
       "4998 -0.645929  0.383265  0.241701  0.609101  0.756135  0.052382  \n",
       "4999 -1.801387  0.448670  0.413843  0.273108  0.251181 -0.036986  \n",
       "\n",
       "[1500 rows x 13 columns]"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Save class values for train and test sets\n",
    "train_labels = train_data['stabf'].to_numpy()\n",
    "test_labels = test_data['stabf'].to_numpy()\n",
    "\n",
    "# Drop class column from train and test sets\n",
    "train = train_data.drop('stabf', axis=1)\n",
    "test = test_data.drop('stabf', axis=1)\n",
    "test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "147cb7ee",
   "metadata": {
    "column": 3,
    "index": 9,
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[ 7.59222336e+00,  1.38950867e+00,  7.28589559e+00, ...,\n",
       "         5.59768619e-01,  1.70528709e-01,  1.59300624e-03],\n",
       "       [ 9.20373904e+00,  3.03113388e+00,  2.74208849e+00, ...,\n",
       "         7.86776143e-01,  5.27851948e-01,  1.59949946e-02],\n",
       "       [ 4.01600415e+00,  8.50112731e+00,  5.34537329e+00, ...,\n",
       "         2.51774855e-01,  5.59975960e-01,  2.78322527e-02],\n",
       "       ...,\n",
       "       [ 1.06943762e+00,  6.58143888e+00,  1.23089213e+00, ...,\n",
       "         7.73236128e-01,  8.22149435e-01, -2.53904805e-02],\n",
       "       [ 4.62974535e+00,  8.35361207e+00,  8.11930402e+00, ...,\n",
       "         6.09100855e-01,  7.56135124e-01,  5.23822770e-02],\n",
       "       [ 7.54511861e-01,  9.72339201e+00,  9.26487092e+00, ...,\n",
       "         2.73108030e-01,  2.51180820e-01, -3.69859336e-02]])"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Convert train and test to numpy arrays\n",
    "train = train.to_numpy()\n",
    "test = test.to_numpy()\n",
    "test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "c89e2526",
   "metadata": {
    "column": 3,
    "index": 10,
    "scrolled": false
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[ 0.03294783,  0.0059878 ,  0.03189501, ...,  0.02445562,\n",
       "         0.00752012,  0.00101395],\n",
       "       [ 0.03994129,  0.01306203,  0.01200387, ...,  0.03437331,\n",
       "         0.02327766,  0.01018084],\n",
       "       [ 0.01742818,  0.03663382,  0.02340011, ...,  0.01099974,\n",
       "         0.02469429,  0.01771527],\n",
       "       ...,\n",
       "       [ 0.00464102,  0.02836133,  0.0053884 , ...,  0.03378176,\n",
       "         0.03625584, -0.01616108],\n",
       "       [ 0.02009162,  0.03599814,  0.03554337, ...,  0.02661089,\n",
       "         0.03334468,  0.03334139],\n",
       "       [ 0.00327434,  0.04190091,  0.04055825, ...,  0.01193176,\n",
       "         0.01107678, -0.0235416 ]])"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# normalize the datasets\n",
    "train = normalize(train, axis=0)\n",
    "test = normalize(test, axis=0)\n",
    "test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "413f8f25",
   "metadata": {
    "column": 3,
    "index": 11
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[0.0529621 , 0.04462797, 0.05458674, ..., 0.06326677, 0.05746328,\n",
       "        0.04569973],\n",
       "       [0.04906884, 0.04705974, 0.05646954, ..., 0.06194467, 0.05296708,\n",
       "        0.05821566],\n",
       "       [0.03821409, 0.05069847, 0.05365513, ..., 0.0557102 , 0.0613269 ,\n",
       "        0.053487  ],\n",
       "       ...,\n",
       "       [0.05835539, 0.05998833, 0.06828727, ..., 0.0537749 , 0.04646163,\n",
       "        0.06121794],\n",
       "       [0.04297523, 0.06438266, 0.06614503, ..., 0.06783632, 0.07152282,\n",
       "        0.0638074 ],\n",
       "       [0.07608597, 0.06118565, 0.06595964, ..., 0.06664703, 0.07698337,\n",
       "        0.07384184]])"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Calculate the Euclidean distances using no loops\n",
    "num_test = test.shape[0]\n",
    "num_train = train.shape[0]\n",
    "dists = np.zeros((num_test, num_train)) \n",
    "sum_squares_train = np.sum(np.square(train), axis=1)\n",
    "sum_squares_test = np.sum(np.square(test), axis=1)\n",
    "sum_combo = np.dot(test, train.T) * -2\n",
    "# Store the distances in the distance matrix\n",
    "dists = np.sqrt(((sum_combo + sum_squares_train).T + sum_squares_test).T)\n",
    "dists"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "3f6d7143",
   "metadata": {
    "column": 3,
    "index": 12
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([1., 1., 1., ..., 0., 1., 0.])"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Make predictions using k nearest neighbors\n",
    "\n",
    "k = 13\n",
    "num_test = dists.shape[0]\n",
    "y_pred = np.zeros(num_test)\n",
    "for i in range(num_test):\n",
    "    nearest_neighbors_indices = np.argsort(dists[i])\n",
    "    closest_y = np.zeros(k)\n",
    "    for m in range(k):\n",
    "        closest_y[m] = train_labels[nearest_neighbors_indices[m]]\n",
    "    labels = []\n",
    "    label_counts = []\n",
    "    for label in closest_y:\n",
    "        if label not in labels:\n",
    "          labels.append(label)\n",
    "          label_counts.append(1)\n",
    "        else:\n",
    "          label_counts[labels.index(label)] = label_counts[labels.index(label)] + 1\n",
    "    mode_labels = np.argsort(label_counts)[::-1]\n",
    "    y_pred[i] = labels[mode_labels[0]]\n",
    "y_pred"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "6af11fab",
   "metadata": {
    "column": 3,
    "index": 13
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Got 1424 / 1500 correct => accuracy: 0.949333\n"
     ]
    }
   ],
   "source": [
    "# Compute and print the fraction of correctly predicted examples\n",
    "num_correct = np.sum(y_pred == test_labels)\n",
    "accuracy = float(num_correct) / num_test\n",
    "print('Got %d / %d correct => accuracy: %f' % (num_correct, num_test, accuracy))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e1fbd334",
   "metadata": {
    "column": 3,
    "index": 14
   },
   "source": [
    "# Section 3: 2nd Analysis"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "bdb19612",
   "metadata": {
    "column": 3,
    "index": 15
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>5000</th>\n",
       "      <td>5.825547</td>\n",
       "      <td>6.153305</td>\n",
       "      <td>9.215683</td>\n",
       "      <td>2.644971</td>\n",
       "      <td>4.749492</td>\n",
       "      <td>-1.491278</td>\n",
       "      <td>-1.382048</td>\n",
       "      <td>-1.876166</td>\n",
       "      <td>0.528459</td>\n",
       "      <td>0.155706</td>\n",
       "      <td>0.156222</td>\n",
       "      <td>0.458131</td>\n",
       "      <td>-0.023089</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5001</th>\n",
       "      <td>2.750088</td>\n",
       "      <td>8.767781</td>\n",
       "      <td>4.517367</td>\n",
       "      <td>1.373404</td>\n",
       "      <td>2.700511</td>\n",
       "      <td>-0.587310</td>\n",
       "      <td>-1.190554</td>\n",
       "      <td>-0.922647</td>\n",
       "      <td>0.471845</td>\n",
       "      <td>0.428823</td>\n",
       "      <td>0.596576</td>\n",
       "      <td>0.249577</td>\n",
       "      <td>-0.021277</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5002</th>\n",
       "      <td>6.253534</td>\n",
       "      <td>6.625686</td>\n",
       "      <td>0.613047</td>\n",
       "      <td>7.550439</td>\n",
       "      <td>4.305593</td>\n",
       "      <td>-1.529390</td>\n",
       "      <td>-1.415248</td>\n",
       "      <td>-1.360955</td>\n",
       "      <td>0.376768</td>\n",
       "      <td>0.686419</td>\n",
       "      <td>0.598896</td>\n",
       "      <td>0.408225</td>\n",
       "      <td>0.009619</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5003</th>\n",
       "      <td>1.800725</td>\n",
       "      <td>1.185765</td>\n",
       "      <td>1.515843</td>\n",
       "      <td>8.576087</td>\n",
       "      <td>4.255226</td>\n",
       "      <td>-1.270079</td>\n",
       "      <td>-1.970055</td>\n",
       "      <td>-1.015092</td>\n",
       "      <td>0.341150</td>\n",
       "      <td>0.623442</td>\n",
       "      <td>0.247956</td>\n",
       "      <td>0.653949</td>\n",
       "      <td>-0.038621</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5004</th>\n",
       "      <td>7.150430</td>\n",
       "      <td>4.837233</td>\n",
       "      <td>3.244408</td>\n",
       "      <td>2.089166</td>\n",
       "      <td>4.539624</td>\n",
       "      <td>-1.981831</td>\n",
       "      <td>-1.375972</td>\n",
       "      <td>-1.181821</td>\n",
       "      <td>0.319280</td>\n",
       "      <td>0.072775</td>\n",
       "      <td>0.842072</td>\n",
       "      <td>0.577839</td>\n",
       "      <td>-0.027978</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9995</th>\n",
       "      <td>2.930406</td>\n",
       "      <td>9.487627</td>\n",
       "      <td>2.376523</td>\n",
       "      <td>6.187797</td>\n",
       "      <td>3.343416</td>\n",
       "      <td>-0.658054</td>\n",
       "      <td>-1.449106</td>\n",
       "      <td>-1.236256</td>\n",
       "      <td>0.601709</td>\n",
       "      <td>0.779642</td>\n",
       "      <td>0.813512</td>\n",
       "      <td>0.608385</td>\n",
       "      <td>0.023892</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9996</th>\n",
       "      <td>3.392299</td>\n",
       "      <td>1.274827</td>\n",
       "      <td>2.954947</td>\n",
       "      <td>6.894759</td>\n",
       "      <td>4.349512</td>\n",
       "      <td>-1.663661</td>\n",
       "      <td>-0.952437</td>\n",
       "      <td>-1.733414</td>\n",
       "      <td>0.502079</td>\n",
       "      <td>0.567242</td>\n",
       "      <td>0.285880</td>\n",
       "      <td>0.366120</td>\n",
       "      <td>-0.025803</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9997</th>\n",
       "      <td>2.364034</td>\n",
       "      <td>2.842030</td>\n",
       "      <td>8.776391</td>\n",
       "      <td>1.008906</td>\n",
       "      <td>4.299976</td>\n",
       "      <td>-1.380719</td>\n",
       "      <td>-0.943884</td>\n",
       "      <td>-1.975373</td>\n",
       "      <td>0.487838</td>\n",
       "      <td>0.986505</td>\n",
       "      <td>0.149286</td>\n",
       "      <td>0.145984</td>\n",
       "      <td>-0.031810</td>\n",
       "      <td>stable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9998</th>\n",
       "      <td>9.631511</td>\n",
       "      <td>3.994398</td>\n",
       "      <td>2.757071</td>\n",
       "      <td>7.821347</td>\n",
       "      <td>2.514755</td>\n",
       "      <td>-0.966330</td>\n",
       "      <td>-0.649915</td>\n",
       "      <td>-0.898510</td>\n",
       "      <td>0.365246</td>\n",
       "      <td>0.587558</td>\n",
       "      <td>0.889118</td>\n",
       "      <td>0.818391</td>\n",
       "      <td>0.037789</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9999</th>\n",
       "      <td>6.530527</td>\n",
       "      <td>6.781790</td>\n",
       "      <td>4.349695</td>\n",
       "      <td>8.673138</td>\n",
       "      <td>3.492807</td>\n",
       "      <td>-1.390285</td>\n",
       "      <td>-1.532193</td>\n",
       "      <td>-0.570329</td>\n",
       "      <td>0.073056</td>\n",
       "      <td>0.505441</td>\n",
       "      <td>0.378761</td>\n",
       "      <td>0.942631</td>\n",
       "      <td>0.045263</td>\n",
       "      <td>unstable</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "5000  5.825547  6.153305  9.215683  2.644971  4.749492 -1.491278 -1.382048   \n",
       "5001  2.750088  8.767781  4.517367  1.373404  2.700511 -0.587310 -1.190554   \n",
       "5002  6.253534  6.625686  0.613047  7.550439  4.305593 -1.529390 -1.415248   \n",
       "5003  1.800725  1.185765  1.515843  8.576087  4.255226 -1.270079 -1.970055   \n",
       "5004  7.150430  4.837233  3.244408  2.089166  4.539624 -1.981831 -1.375972   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "9995  2.930406  9.487627  2.376523  6.187797  3.343416 -0.658054 -1.449106   \n",
       "9996  3.392299  1.274827  2.954947  6.894759  4.349512 -1.663661 -0.952437   \n",
       "9997  2.364034  2.842030  8.776391  1.008906  4.299976 -1.380719 -0.943884   \n",
       "9998  9.631511  3.994398  2.757071  7.821347  2.514755 -0.966330 -0.649915   \n",
       "9999  6.530527  6.781790  4.349695  8.673138  3.492807 -1.390285 -1.532193   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab     stabf  \n",
       "5000 -1.876166  0.528459  0.155706  0.156222  0.458131 -0.023089    stable  \n",
       "5001 -0.922647  0.471845  0.428823  0.596576  0.249577 -0.021277    stable  \n",
       "5002 -1.360955  0.376768  0.686419  0.598896  0.408225  0.009619  unstable  \n",
       "5003 -1.015092  0.341150  0.623442  0.247956  0.653949 -0.038621    stable  \n",
       "5004 -1.181821  0.319280  0.072775  0.842072  0.577839 -0.027978    stable  \n",
       "...        ...       ...       ...       ...       ...       ...       ...  \n",
       "9995 -1.236256  0.601709  0.779642  0.813512  0.608385  0.023892  unstable  \n",
       "9996 -1.733414  0.502079  0.567242  0.285880  0.366120 -0.025803    stable  \n",
       "9997 -1.975373  0.487838  0.986505  0.149286  0.145984 -0.031810    stable  \n",
       "9998 -0.898510  0.365246  0.587558  0.889118  0.818391  0.037789  unstable  \n",
       "9999 -0.570329  0.073056  0.505441  0.378761  0.942631  0.045263  unstable  \n",
       "\n",
       "[5000 rows x 14 columns]"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "my_data = data.tail(5000)\n",
    "my_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "997e3cd5",
   "metadata": {
    "column": 3,
    "index": 16
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\harde\\AppData\\Local\\Programs\\Python\\Python39\\lib\\site-packages\\pandas\\core\\indexing.py:1817: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\n",
      "\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
      "  self._setitem_single_column(loc, value, pi)\n",
      "C:\\Users\\harde\\AppData\\Local\\Temp\\ipykernel_21872\\9913949.py:8: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\n",
      "\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
      "  my_data['stabf'] = pd.to_numeric(my_data['stabf'])\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>5000</th>\n",
       "      <td>5.825547</td>\n",
       "      <td>6.153305</td>\n",
       "      <td>9.215683</td>\n",
       "      <td>2.644971</td>\n",
       "      <td>4.749492</td>\n",
       "      <td>-1.491278</td>\n",
       "      <td>-1.382048</td>\n",
       "      <td>-1.876166</td>\n",
       "      <td>0.528459</td>\n",
       "      <td>0.155706</td>\n",
       "      <td>0.156222</td>\n",
       "      <td>0.458131</td>\n",
       "      <td>-0.023089</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5001</th>\n",
       "      <td>2.750088</td>\n",
       "      <td>8.767781</td>\n",
       "      <td>4.517367</td>\n",
       "      <td>1.373404</td>\n",
       "      <td>2.700511</td>\n",
       "      <td>-0.587310</td>\n",
       "      <td>-1.190554</td>\n",
       "      <td>-0.922647</td>\n",
       "      <td>0.471845</td>\n",
       "      <td>0.428823</td>\n",
       "      <td>0.596576</td>\n",
       "      <td>0.249577</td>\n",
       "      <td>-0.021277</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5002</th>\n",
       "      <td>6.253534</td>\n",
       "      <td>6.625686</td>\n",
       "      <td>0.613047</td>\n",
       "      <td>7.550439</td>\n",
       "      <td>4.305593</td>\n",
       "      <td>-1.529390</td>\n",
       "      <td>-1.415248</td>\n",
       "      <td>-1.360955</td>\n",
       "      <td>0.376768</td>\n",
       "      <td>0.686419</td>\n",
       "      <td>0.598896</td>\n",
       "      <td>0.408225</td>\n",
       "      <td>0.009619</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5003</th>\n",
       "      <td>1.800725</td>\n",
       "      <td>1.185765</td>\n",
       "      <td>1.515843</td>\n",
       "      <td>8.576087</td>\n",
       "      <td>4.255226</td>\n",
       "      <td>-1.270079</td>\n",
       "      <td>-1.970055</td>\n",
       "      <td>-1.015092</td>\n",
       "      <td>0.341150</td>\n",
       "      <td>0.623442</td>\n",
       "      <td>0.247956</td>\n",
       "      <td>0.653949</td>\n",
       "      <td>-0.038621</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5004</th>\n",
       "      <td>7.150430</td>\n",
       "      <td>4.837233</td>\n",
       "      <td>3.244408</td>\n",
       "      <td>2.089166</td>\n",
       "      <td>4.539624</td>\n",
       "      <td>-1.981831</td>\n",
       "      <td>-1.375972</td>\n",
       "      <td>-1.181821</td>\n",
       "      <td>0.319280</td>\n",
       "      <td>0.072775</td>\n",
       "      <td>0.842072</td>\n",
       "      <td>0.577839</td>\n",
       "      <td>-0.027978</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9995</th>\n",
       "      <td>2.930406</td>\n",
       "      <td>9.487627</td>\n",
       "      <td>2.376523</td>\n",
       "      <td>6.187797</td>\n",
       "      <td>3.343416</td>\n",
       "      <td>-0.658054</td>\n",
       "      <td>-1.449106</td>\n",
       "      <td>-1.236256</td>\n",
       "      <td>0.601709</td>\n",
       "      <td>0.779642</td>\n",
       "      <td>0.813512</td>\n",
       "      <td>0.608385</td>\n",
       "      <td>0.023892</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9996</th>\n",
       "      <td>3.392299</td>\n",
       "      <td>1.274827</td>\n",
       "      <td>2.954947</td>\n",
       "      <td>6.894759</td>\n",
       "      <td>4.349512</td>\n",
       "      <td>-1.663661</td>\n",
       "      <td>-0.952437</td>\n",
       "      <td>-1.733414</td>\n",
       "      <td>0.502079</td>\n",
       "      <td>0.567242</td>\n",
       "      <td>0.285880</td>\n",
       "      <td>0.366120</td>\n",
       "      <td>-0.025803</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9997</th>\n",
       "      <td>2.364034</td>\n",
       "      <td>2.842030</td>\n",
       "      <td>8.776391</td>\n",
       "      <td>1.008906</td>\n",
       "      <td>4.299976</td>\n",
       "      <td>-1.380719</td>\n",
       "      <td>-0.943884</td>\n",
       "      <td>-1.975373</td>\n",
       "      <td>0.487838</td>\n",
       "      <td>0.986505</td>\n",
       "      <td>0.149286</td>\n",
       "      <td>0.145984</td>\n",
       "      <td>-0.031810</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9998</th>\n",
       "      <td>9.631511</td>\n",
       "      <td>3.994398</td>\n",
       "      <td>2.757071</td>\n",
       "      <td>7.821347</td>\n",
       "      <td>2.514755</td>\n",
       "      <td>-0.966330</td>\n",
       "      <td>-0.649915</td>\n",
       "      <td>-0.898510</td>\n",
       "      <td>0.365246</td>\n",
       "      <td>0.587558</td>\n",
       "      <td>0.889118</td>\n",
       "      <td>0.818391</td>\n",
       "      <td>0.037789</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9999</th>\n",
       "      <td>6.530527</td>\n",
       "      <td>6.781790</td>\n",
       "      <td>4.349695</td>\n",
       "      <td>8.673138</td>\n",
       "      <td>3.492807</td>\n",
       "      <td>-1.390285</td>\n",
       "      <td>-1.532193</td>\n",
       "      <td>-0.570329</td>\n",
       "      <td>0.073056</td>\n",
       "      <td>0.505441</td>\n",
       "      <td>0.378761</td>\n",
       "      <td>0.942631</td>\n",
       "      <td>0.045263</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "5000  5.825547  6.153305  9.215683  2.644971  4.749492 -1.491278 -1.382048   \n",
       "5001  2.750088  8.767781  4.517367  1.373404  2.700511 -0.587310 -1.190554   \n",
       "5002  6.253534  6.625686  0.613047  7.550439  4.305593 -1.529390 -1.415248   \n",
       "5003  1.800725  1.185765  1.515843  8.576087  4.255226 -1.270079 -1.970055   \n",
       "5004  7.150430  4.837233  3.244408  2.089166  4.539624 -1.981831 -1.375972   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "9995  2.930406  9.487627  2.376523  6.187797  3.343416 -0.658054 -1.449106   \n",
       "9996  3.392299  1.274827  2.954947  6.894759  4.349512 -1.663661 -0.952437   \n",
       "9997  2.364034  2.842030  8.776391  1.008906  4.299976 -1.380719 -0.943884   \n",
       "9998  9.631511  3.994398  2.757071  7.821347  2.514755 -0.966330 -0.649915   \n",
       "9999  6.530527  6.781790  4.349695  8.673138  3.492807 -1.390285 -1.532193   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab  stabf  \n",
       "5000 -1.876166  0.528459  0.155706  0.156222  0.458131 -0.023089      0  \n",
       "5001 -0.922647  0.471845  0.428823  0.596576  0.249577 -0.021277      0  \n",
       "5002 -1.360955  0.376768  0.686419  0.598896  0.408225  0.009619      1  \n",
       "5003 -1.015092  0.341150  0.623442  0.247956  0.653949 -0.038621      0  \n",
       "5004 -1.181821  0.319280  0.072775  0.842072  0.577839 -0.027978      0  \n",
       "...        ...       ...       ...       ...       ...       ...    ...  \n",
       "9995 -1.236256  0.601709  0.779642  0.813512  0.608385  0.023892      1  \n",
       "9996 -1.733414  0.502079  0.567242  0.285880  0.366120 -0.025803      0  \n",
       "9997 -1.975373  0.487838  0.986505  0.149286  0.145984 -0.031810      0  \n",
       "9998 -0.898510  0.365246  0.587558  0.889118  0.818391  0.037789      1  \n",
       "9999 -0.570329  0.073056  0.505441  0.378761  0.942631  0.045263      1  \n",
       "\n",
       "[5000 rows x 14 columns]"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Convert Class names to numbers\n",
    "# 0 = stable\n",
    "# 1 = unstable\n",
    "\n",
    "# assign values to the dependent variable\n",
    "my_data.loc[(my_data['stabf'] == 'stable'), 'stabf'] = 0\n",
    "my_data.loc[(my_data['stabf'] == 'unstable'), 'stabf'] = 1\n",
    "my_data['stabf'] = pd.to_numeric(my_data['stabf'])\n",
    "my_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "56d7de20",
   "metadata": {
    "column": 3,
    "index": 17
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "      <th>stabf</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>8000</th>\n",
       "      <td>5.306905</td>\n",
       "      <td>2.452792</td>\n",
       "      <td>5.414825</td>\n",
       "      <td>4.964973</td>\n",
       "      <td>2.853706</td>\n",
       "      <td>-0.952709</td>\n",
       "      <td>-1.391630</td>\n",
       "      <td>-0.509366</td>\n",
       "      <td>0.160440</td>\n",
       "      <td>0.958669</td>\n",
       "      <td>0.867021</td>\n",
       "      <td>0.183520</td>\n",
       "      <td>0.026496</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8001</th>\n",
       "      <td>7.745244</td>\n",
       "      <td>4.311693</td>\n",
       "      <td>7.893386</td>\n",
       "      <td>0.917804</td>\n",
       "      <td>3.457962</td>\n",
       "      <td>-1.425012</td>\n",
       "      <td>-1.291345</td>\n",
       "      <td>-0.741605</td>\n",
       "      <td>0.576198</td>\n",
       "      <td>0.851929</td>\n",
       "      <td>0.172012</td>\n",
       "      <td>0.788637</td>\n",
       "      <td>-0.004614</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8002</th>\n",
       "      <td>5.279096</td>\n",
       "      <td>5.458030</td>\n",
       "      <td>4.123039</td>\n",
       "      <td>9.860768</td>\n",
       "      <td>2.441075</td>\n",
       "      <td>-1.028213</td>\n",
       "      <td>-0.790346</td>\n",
       "      <td>-0.622516</td>\n",
       "      <td>0.462567</td>\n",
       "      <td>0.287156</td>\n",
       "      <td>0.252946</td>\n",
       "      <td>0.663104</td>\n",
       "      <td>0.021423</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8003</th>\n",
       "      <td>1.596736</td>\n",
       "      <td>5.744044</td>\n",
       "      <td>5.888295</td>\n",
       "      <td>2.434392</td>\n",
       "      <td>3.762364</td>\n",
       "      <td>-1.019351</td>\n",
       "      <td>-0.869846</td>\n",
       "      <td>-1.873167</td>\n",
       "      <td>0.769447</td>\n",
       "      <td>0.733218</td>\n",
       "      <td>0.096916</td>\n",
       "      <td>0.159050</td>\n",
       "      <td>-0.033336</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8004</th>\n",
       "      <td>7.214450</td>\n",
       "      <td>2.265906</td>\n",
       "      <td>3.889059</td>\n",
       "      <td>9.012663</td>\n",
       "      <td>3.675266</td>\n",
       "      <td>-0.722557</td>\n",
       "      <td>-1.249246</td>\n",
       "      <td>-1.703463</td>\n",
       "      <td>0.837425</td>\n",
       "      <td>0.599088</td>\n",
       "      <td>0.975245</td>\n",
       "      <td>0.772472</td>\n",
       "      <td>0.061052</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9995</th>\n",
       "      <td>2.930406</td>\n",
       "      <td>9.487627</td>\n",
       "      <td>2.376523</td>\n",
       "      <td>6.187797</td>\n",
       "      <td>3.343416</td>\n",
       "      <td>-0.658054</td>\n",
       "      <td>-1.449106</td>\n",
       "      <td>-1.236256</td>\n",
       "      <td>0.601709</td>\n",
       "      <td>0.779642</td>\n",
       "      <td>0.813512</td>\n",
       "      <td>0.608385</td>\n",
       "      <td>0.023892</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9996</th>\n",
       "      <td>3.392299</td>\n",
       "      <td>1.274827</td>\n",
       "      <td>2.954947</td>\n",
       "      <td>6.894759</td>\n",
       "      <td>4.349512</td>\n",
       "      <td>-1.663661</td>\n",
       "      <td>-0.952437</td>\n",
       "      <td>-1.733414</td>\n",
       "      <td>0.502079</td>\n",
       "      <td>0.567242</td>\n",
       "      <td>0.285880</td>\n",
       "      <td>0.366120</td>\n",
       "      <td>-0.025803</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9997</th>\n",
       "      <td>2.364034</td>\n",
       "      <td>2.842030</td>\n",
       "      <td>8.776391</td>\n",
       "      <td>1.008906</td>\n",
       "      <td>4.299976</td>\n",
       "      <td>-1.380719</td>\n",
       "      <td>-0.943884</td>\n",
       "      <td>-1.975373</td>\n",
       "      <td>0.487838</td>\n",
       "      <td>0.986505</td>\n",
       "      <td>0.149286</td>\n",
       "      <td>0.145984</td>\n",
       "      <td>-0.031810</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9998</th>\n",
       "      <td>9.631511</td>\n",
       "      <td>3.994398</td>\n",
       "      <td>2.757071</td>\n",
       "      <td>7.821347</td>\n",
       "      <td>2.514755</td>\n",
       "      <td>-0.966330</td>\n",
       "      <td>-0.649915</td>\n",
       "      <td>-0.898510</td>\n",
       "      <td>0.365246</td>\n",
       "      <td>0.587558</td>\n",
       "      <td>0.889118</td>\n",
       "      <td>0.818391</td>\n",
       "      <td>0.037789</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9999</th>\n",
       "      <td>6.530527</td>\n",
       "      <td>6.781790</td>\n",
       "      <td>4.349695</td>\n",
       "      <td>8.673138</td>\n",
       "      <td>3.492807</td>\n",
       "      <td>-1.390285</td>\n",
       "      <td>-1.532193</td>\n",
       "      <td>-0.570329</td>\n",
       "      <td>0.073056</td>\n",
       "      <td>0.505441</td>\n",
       "      <td>0.378761</td>\n",
       "      <td>0.942631</td>\n",
       "      <td>0.045263</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2000 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "8000  5.306905  2.452792  5.414825  4.964973  2.853706 -0.952709 -1.391630   \n",
       "8001  7.745244  4.311693  7.893386  0.917804  3.457962 -1.425012 -1.291345   \n",
       "8002  5.279096  5.458030  4.123039  9.860768  2.441075 -1.028213 -0.790346   \n",
       "8003  1.596736  5.744044  5.888295  2.434392  3.762364 -1.019351 -0.869846   \n",
       "8004  7.214450  2.265906  3.889059  9.012663  3.675266 -0.722557 -1.249246   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "9995  2.930406  9.487627  2.376523  6.187797  3.343416 -0.658054 -1.449106   \n",
       "9996  3.392299  1.274827  2.954947  6.894759  4.349512 -1.663661 -0.952437   \n",
       "9997  2.364034  2.842030  8.776391  1.008906  4.299976 -1.380719 -0.943884   \n",
       "9998  9.631511  3.994398  2.757071  7.821347  2.514755 -0.966330 -0.649915   \n",
       "9999  6.530527  6.781790  4.349695  8.673138  3.492807 -1.390285 -1.532193   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab  stabf  \n",
       "8000 -0.509366  0.160440  0.958669  0.867021  0.183520  0.026496      1  \n",
       "8001 -0.741605  0.576198  0.851929  0.172012  0.788637 -0.004614      0  \n",
       "8002 -0.622516  0.462567  0.287156  0.252946  0.663104  0.021423      1  \n",
       "8003 -1.873167  0.769447  0.733218  0.096916  0.159050 -0.033336      0  \n",
       "8004 -1.703463  0.837425  0.599088  0.975245  0.772472  0.061052      1  \n",
       "...        ...       ...       ...       ...       ...       ...    ...  \n",
       "9995 -1.236256  0.601709  0.779642  0.813512  0.608385  0.023892      1  \n",
       "9996 -1.733414  0.502079  0.567242  0.285880  0.366120 -0.025803      0  \n",
       "9997 -1.975373  0.487838  0.986505  0.149286  0.145984 -0.031810      0  \n",
       "9998 -0.898510  0.365246  0.587558  0.889118  0.818391  0.037789      1  \n",
       "9999 -0.570329  0.073056  0.505441  0.378761  0.942631  0.045263      1  \n",
       "\n",
       "[2000 rows x 14 columns]"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Split dataframe into testing and training sets\n",
    "train_data = my_data.iloc[:3000]\n",
    "test_data = my_data.iloc[3000:]\n",
    "test_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "163334ca",
   "metadata": {
    "column": 3,
    "index": 18
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tau1</th>\n",
       "      <th>tau2</th>\n",
       "      <th>tau3</th>\n",
       "      <th>tau4</th>\n",
       "      <th>p1</th>\n",
       "      <th>p2</th>\n",
       "      <th>p3</th>\n",
       "      <th>p4</th>\n",
       "      <th>g1</th>\n",
       "      <th>g2</th>\n",
       "      <th>g3</th>\n",
       "      <th>g4</th>\n",
       "      <th>stab</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>8000</th>\n",
       "      <td>5.306905</td>\n",
       "      <td>2.452792</td>\n",
       "      <td>5.414825</td>\n",
       "      <td>4.964973</td>\n",
       "      <td>2.853706</td>\n",
       "      <td>-0.952709</td>\n",
       "      <td>-1.391630</td>\n",
       "      <td>-0.509366</td>\n",
       "      <td>0.160440</td>\n",
       "      <td>0.958669</td>\n",
       "      <td>0.867021</td>\n",
       "      <td>0.183520</td>\n",
       "      <td>0.026496</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8001</th>\n",
       "      <td>7.745244</td>\n",
       "      <td>4.311693</td>\n",
       "      <td>7.893386</td>\n",
       "      <td>0.917804</td>\n",
       "      <td>3.457962</td>\n",
       "      <td>-1.425012</td>\n",
       "      <td>-1.291345</td>\n",
       "      <td>-0.741605</td>\n",
       "      <td>0.576198</td>\n",
       "      <td>0.851929</td>\n",
       "      <td>0.172012</td>\n",
       "      <td>0.788637</td>\n",
       "      <td>-0.004614</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8002</th>\n",
       "      <td>5.279096</td>\n",
       "      <td>5.458030</td>\n",
       "      <td>4.123039</td>\n",
       "      <td>9.860768</td>\n",
       "      <td>2.441075</td>\n",
       "      <td>-1.028213</td>\n",
       "      <td>-0.790346</td>\n",
       "      <td>-0.622516</td>\n",
       "      <td>0.462567</td>\n",
       "      <td>0.287156</td>\n",
       "      <td>0.252946</td>\n",
       "      <td>0.663104</td>\n",
       "      <td>0.021423</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8003</th>\n",
       "      <td>1.596736</td>\n",
       "      <td>5.744044</td>\n",
       "      <td>5.888295</td>\n",
       "      <td>2.434392</td>\n",
       "      <td>3.762364</td>\n",
       "      <td>-1.019351</td>\n",
       "      <td>-0.869846</td>\n",
       "      <td>-1.873167</td>\n",
       "      <td>0.769447</td>\n",
       "      <td>0.733218</td>\n",
       "      <td>0.096916</td>\n",
       "      <td>0.159050</td>\n",
       "      <td>-0.033336</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8004</th>\n",
       "      <td>7.214450</td>\n",
       "      <td>2.265906</td>\n",
       "      <td>3.889059</td>\n",
       "      <td>9.012663</td>\n",
       "      <td>3.675266</td>\n",
       "      <td>-0.722557</td>\n",
       "      <td>-1.249246</td>\n",
       "      <td>-1.703463</td>\n",
       "      <td>0.837425</td>\n",
       "      <td>0.599088</td>\n",
       "      <td>0.975245</td>\n",
       "      <td>0.772472</td>\n",
       "      <td>0.061052</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9995</th>\n",
       "      <td>2.930406</td>\n",
       "      <td>9.487627</td>\n",
       "      <td>2.376523</td>\n",
       "      <td>6.187797</td>\n",
       "      <td>3.343416</td>\n",
       "      <td>-0.658054</td>\n",
       "      <td>-1.449106</td>\n",
       "      <td>-1.236256</td>\n",
       "      <td>0.601709</td>\n",
       "      <td>0.779642</td>\n",
       "      <td>0.813512</td>\n",
       "      <td>0.608385</td>\n",
       "      <td>0.023892</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9996</th>\n",
       "      <td>3.392299</td>\n",
       "      <td>1.274827</td>\n",
       "      <td>2.954947</td>\n",
       "      <td>6.894759</td>\n",
       "      <td>4.349512</td>\n",
       "      <td>-1.663661</td>\n",
       "      <td>-0.952437</td>\n",
       "      <td>-1.733414</td>\n",
       "      <td>0.502079</td>\n",
       "      <td>0.567242</td>\n",
       "      <td>0.285880</td>\n",
       "      <td>0.366120</td>\n",
       "      <td>-0.025803</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9997</th>\n",
       "      <td>2.364034</td>\n",
       "      <td>2.842030</td>\n",
       "      <td>8.776391</td>\n",
       "      <td>1.008906</td>\n",
       "      <td>4.299976</td>\n",
       "      <td>-1.380719</td>\n",
       "      <td>-0.943884</td>\n",
       "      <td>-1.975373</td>\n",
       "      <td>0.487838</td>\n",
       "      <td>0.986505</td>\n",
       "      <td>0.149286</td>\n",
       "      <td>0.145984</td>\n",
       "      <td>-0.031810</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9998</th>\n",
       "      <td>9.631511</td>\n",
       "      <td>3.994398</td>\n",
       "      <td>2.757071</td>\n",
       "      <td>7.821347</td>\n",
       "      <td>2.514755</td>\n",
       "      <td>-0.966330</td>\n",
       "      <td>-0.649915</td>\n",
       "      <td>-0.898510</td>\n",
       "      <td>0.365246</td>\n",
       "      <td>0.587558</td>\n",
       "      <td>0.889118</td>\n",
       "      <td>0.818391</td>\n",
       "      <td>0.037789</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9999</th>\n",
       "      <td>6.530527</td>\n",
       "      <td>6.781790</td>\n",
       "      <td>4.349695</td>\n",
       "      <td>8.673138</td>\n",
       "      <td>3.492807</td>\n",
       "      <td>-1.390285</td>\n",
       "      <td>-1.532193</td>\n",
       "      <td>-0.570329</td>\n",
       "      <td>0.073056</td>\n",
       "      <td>0.505441</td>\n",
       "      <td>0.378761</td>\n",
       "      <td>0.942631</td>\n",
       "      <td>0.045263</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2000 rows × 13 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          tau1      tau2      tau3      tau4        p1        p2        p3  \\\n",
       "8000  5.306905  2.452792  5.414825  4.964973  2.853706 -0.952709 -1.391630   \n",
       "8001  7.745244  4.311693  7.893386  0.917804  3.457962 -1.425012 -1.291345   \n",
       "8002  5.279096  5.458030  4.123039  9.860768  2.441075 -1.028213 -0.790346   \n",
       "8003  1.596736  5.744044  5.888295  2.434392  3.762364 -1.019351 -0.869846   \n",
       "8004  7.214450  2.265906  3.889059  9.012663  3.675266 -0.722557 -1.249246   \n",
       "...        ...       ...       ...       ...       ...       ...       ...   \n",
       "9995  2.930406  9.487627  2.376523  6.187797  3.343416 -0.658054 -1.449106   \n",
       "9996  3.392299  1.274827  2.954947  6.894759  4.349512 -1.663661 -0.952437   \n",
       "9997  2.364034  2.842030  8.776391  1.008906  4.299976 -1.380719 -0.943884   \n",
       "9998  9.631511  3.994398  2.757071  7.821347  2.514755 -0.966330 -0.649915   \n",
       "9999  6.530527  6.781790  4.349695  8.673138  3.492807 -1.390285 -1.532193   \n",
       "\n",
       "            p4        g1        g2        g3        g4      stab  \n",
       "8000 -0.509366  0.160440  0.958669  0.867021  0.183520  0.026496  \n",
       "8001 -0.741605  0.576198  0.851929  0.172012  0.788637 -0.004614  \n",
       "8002 -0.622516  0.462567  0.287156  0.252946  0.663104  0.021423  \n",
       "8003 -1.873167  0.769447  0.733218  0.096916  0.159050 -0.033336  \n",
       "8004 -1.703463  0.837425  0.599088  0.975245  0.772472  0.061052  \n",
       "...        ...       ...       ...       ...       ...       ...  \n",
       "9995 -1.236256  0.601709  0.779642  0.813512  0.608385  0.023892  \n",
       "9996 -1.733414  0.502079  0.567242  0.285880  0.366120 -0.025803  \n",
       "9997 -1.975373  0.487838  0.986505  0.149286  0.145984 -0.031810  \n",
       "9998 -0.898510  0.365246  0.587558  0.889118  0.818391  0.037789  \n",
       "9999 -0.570329  0.073056  0.505441  0.378761  0.942631  0.045263  \n",
       "\n",
       "[2000 rows x 13 columns]"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Save class values for train and test sets\n",
    "train_labels = train_data['stabf'].to_numpy()\n",
    "test_labels = test_data['stabf'].to_numpy()\n",
    "\n",
    "# Drop class column from train and test sets\n",
    "train = train_data.drop('stabf', axis=1)\n",
    "test = test_data.drop('stabf', axis=1)\n",
    "test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "9857c37b",
   "metadata": {
    "column": 3,
    "index": 19
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[ 5.30690458e+00,  2.45279249e+00,  5.41482459e+00, ...,\n",
       "         8.67021410e-01,  1.83519882e-01,  2.64962906e-02],\n",
       "       [ 7.74524391e+00,  4.31169345e+00,  7.89338602e+00, ...,\n",
       "         1.72011877e-01,  7.88636816e-01, -4.61427241e-03],\n",
       "       [ 5.27909591e+00,  5.45802967e+00,  4.12303948e+00, ...,\n",
       "         2.52945554e-01,  6.63103928e-01,  2.14226453e-02],\n",
       "       ...,\n",
       "       [ 2.36403419e+00,  2.84203025e+00,  8.77639096e+00, ...,\n",
       "         1.49286458e-01,  1.45984032e-01, -3.18098881e-02],\n",
       "       [ 9.63151069e+00,  3.99439760e+00,  2.75707093e+00, ...,\n",
       "         8.89118346e-01,  8.18391326e-01,  3.77888091e-02],\n",
       "       [ 6.53052662e+00,  6.78178990e+00,  4.34969522e+00, ...,\n",
       "         3.78760930e-01,  9.42630833e-01,  4.52633082e-02]])"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Convert train and test to numpy arrays\n",
    "train = train.to_numpy()\n",
    "test = test.to_numpy()\n",
    "test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "6cbbab41",
   "metadata": {
    "column": 3,
    "index": 20
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[ 6.39588195,  7.80684936,  7.1736136 , ...,  9.22110562,\n",
       "         6.16111504,  3.50595046],\n",
       "       [ 3.92085128,  7.64151855, 10.30036779, ..., 11.94195104,\n",
       "         8.36223921,  5.99341579],\n",
       "       [ 9.29110844,  9.5060078 ,  4.99855722, ...,  5.72491318,\n",
       "         9.68261024,  8.15986122],\n",
       "       ...,\n",
       "       [ 5.19825475,  7.64295322, 11.82678916, ..., 11.25359651,\n",
       "         8.97047589,  4.66049535],\n",
       "       [ 9.7621717 , 10.75797324,  5.25276363, ..., 10.17725321,\n",
       "         8.12872306,  8.60682185],\n",
       "       [ 8.05260679,  8.58839637,  4.13559361, ...,  5.74372075,\n",
       "         9.38195329,  8.1618491 ]])"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Calculate the Euclidean distances using 1 loop\n",
    "num_test = test.shape[0]\n",
    "num_train = train.shape[0]\n",
    "dists = np.zeros((num_test, num_train))\n",
    "for i in range(num_test):\n",
    "    test_point = test[i]\n",
    "    subtraction_matrix_1l = train - test_point\n",
    "    squared_matrix_1l = np.square(subtraction_matrix_1l)\n",
    "    sum_of_squares_vector = np.sum(squared_matrix_1l, axis=1)\n",
    "    distances_vector = np.sqrt(sum_of_squares_vector)\n",
    "    # Store the distances in the distance matrix\n",
    "    dists[i] = distances_vector\n",
    "dists"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "7a2a277f",
   "metadata": {
    "column": 3,
    "index": 21
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([1., 1., 1., ..., 0., 1., 1.])"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Make predictions using k nearest neighbors\n",
    "\n",
    "k = 23\n",
    "num_test = dists.shape[0]\n",
    "y_pred = np.zeros(num_test)\n",
    "for i in range(num_test):\n",
    "    nearest_neighbors_indices = np.argsort(dists[i])\n",
    "    closest_y = np.zeros(k)\n",
    "    for m in range(k):\n",
    "        closest_y[m] = train_labels[nearest_neighbors_indices[m]]\n",
    "    labels = []\n",
    "    label_counts = []\n",
    "    for label in closest_y:\n",
    "        if label not in labels:\n",
    "          labels.append(label)\n",
    "          label_counts.append(1)\n",
    "        else:\n",
    "          label_counts[labels.index(label)] = label_counts[labels.index(label)] + 1\n",
    "    mode_labels = np.argsort(label_counts)[::-1]\n",
    "    y_pred[i] = labels[mode_labels[0]]\n",
    "y_pred"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "bdb48ddd",
   "metadata": {
    "column": 3,
    "index": 22
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Got 1566 / 2000 correct => accuracy: 0.783000\n"
     ]
    }
   ],
   "source": [
    "# Compute and print the fraction of correctly predicted examples\n",
    "num_correct = np.sum(y_pred == test_labels)\n",
    "accuracy = float(num_correct) / num_test\n",
    "print('Got %d / %d correct => accuracy: %f' % (num_correct, num_test, accuracy))"
   ]
  }
 ],
 "metadata": {
  "columns": 3,
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.1"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
