{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "0c47c369",
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.insert(0, '../Results')\n",
    "sys.path.insert(0, '../../../src')\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import pickle\n",
    "import os\n",
    "from visualization import perc, SetPlotRC, ApplyFont\n",
    "from itertools import product"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "7d6309a3",
   "metadata": {},
   "source": [
    "# CorInfoMax"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "893334f8",
   "metadata": {},
   "source": [
    "## MNIST Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "5ae6edbb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "3.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.989155</td>\n",
       "      <td>0.97613</td>\n",
       "      <td>0.000575</td>\n",
       "      <td>0.001077</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.989195</td>\n",
       "      <td>0.97610</td>\n",
       "      <td>0.000386</td>\n",
       "      <td>0.000992</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.989307</td>\n",
       "      <td>0.97622</td>\n",
       "      <td>0.000493</td>\n",
       "      <td>0.001207</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>0.989295</td>\n",
       "      <td>0.97622</td>\n",
       "      <td>0.000417</td>\n",
       "      <td>0.000991</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>0.987767</td>\n",
       "      <td>0.97424</td>\n",
       "      <td>0.001131</td>\n",
       "      <td>0.001822</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>0.931058</td>\n",
       "      <td>0.91941</td>\n",
       "      <td>0.180652</td>\n",
       "      <td>0.175128</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>0.934550</td>\n",
       "      <td>0.92247</td>\n",
       "      <td>0.169365</td>\n",
       "      <td>0.164016</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>0.987168</td>\n",
       "      <td>0.97320</td>\n",
       "      <td>0.002661</td>\n",
       "      <td>0.003601</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.989155  0.97613     0.000575     0.001077\n",
       "1               2  0.989195  0.97610     0.000386     0.000992\n",
       "2               3  0.989307  0.97622     0.000493     0.001207\n",
       "3               4  0.989295  0.97622     0.000417     0.000991\n",
       "4               5  0.987767  0.97424     0.001131     0.001822\n",
       "5               6  0.931058  0.91941     0.180652     0.175128\n",
       "6               7  0.934550  0.92247     0.169365     0.164016\n",
       "7               8  0.987168  0.97320     0.002661     0.003601"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_MNIST_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "36545176",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 5\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 6\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 7\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 8\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.15])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [784, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_ = 0.99999\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([1.0, 0.7]), 'fb': np.array([0.15, 0.15])}]\n",
    "lr_decay_multiplier_list = [0.95, 0.99]\n",
    "neural_lr_start_list = [0.05]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\", \"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [30]\n",
    "hopfield_g_list = [0.5, 0.2]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "\n",
    "setting_number = 0\n",
    "for lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "1d5bdec1",
   "metadata": {},
   "source": [
    "# MNIST 3 Layers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "33273bd8",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "3\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.989412</td>\n",
       "      <td>0.97552</td>\n",
       "      <td>0.000380</td>\n",
       "      <td>0.001333</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.989470</td>\n",
       "      <td>0.97520</td>\n",
       "      <td>0.000267</td>\n",
       "      <td>0.000926</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.989977</td>\n",
       "      <td>0.97583</td>\n",
       "      <td>0.000301</td>\n",
       "      <td>0.000723</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>0.990047</td>\n",
       "      <td>0.97551</td>\n",
       "      <td>0.000314</td>\n",
       "      <td>0.000857</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.989412  0.97552     0.000380     0.001333\n",
       "1               2  0.989470  0.97520     0.000267     0.000926\n",
       "2               3  0.989977  0.97583     0.000301     0.000723\n",
       "3               4  0.990047  0.97551     0.000314     0.000857"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_MNIST_3Layers_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "best_setting = 3\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "63206414",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1.1 , 0.75, 0.6 ]), 'fb': array([ nan, 0.17, 0.07])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1.1 , 0.75, 0.6 ]), 'fb': array([ nan, 0.17, 0.07])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1.1 , 0.75, 0.6 ]), 'fb': array([ nan, 0.17, 0.07])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1.1 , 0.75, 0.6 ]), 'fb': array([ nan, 0.17, 0.07])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 500, 10]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [784, 500, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_ = 0.99999\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([1.1, 0.75, 0.6]), 'fb': np.array([np.nan, 0.17, 0.07])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.05]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\", \"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [30]\n",
    "hopfield_g_list = [0.5, 0.2]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "\n",
    "setting_number = 0\n",
    "for lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6406595d",
   "metadata": {},
   "source": [
    "## Fashion MNIST Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "23b60cfb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.914685</td>\n",
       "      <td>0.88138</td>\n",
       "      <td>0.002203</td>\n",
       "      <td>0.002773</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.912300</td>\n",
       "      <td>0.88140</td>\n",
       "      <td>0.001062</td>\n",
       "      <td>0.001562</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.899613</td>\n",
       "      <td>0.87215</td>\n",
       "      <td>0.027887</td>\n",
       "      <td>0.023662</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>0.905308</td>\n",
       "      <td>0.87770</td>\n",
       "      <td>0.001197</td>\n",
       "      <td>0.002255</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.914685  0.88138     0.002203     0.002773\n",
       "1               2  0.912300  0.88140     0.001062     0.001562\n",
       "2               3  0.899613  0.87215     0.027887     0.023662\n",
       "3               4  0.905308  0.87770     0.001197     0.002255"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_FashionMNIST_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "d85e2a23",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.3 , 0.22]), 'fb': array([ nan, 0.07])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.07\n",
      "hopfield_g 0.3\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.3 , 0.22]), 'fb': array([ nan, 0.07])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.3\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.25, 0.15]), 'fb': array([0.15, 0.09])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.07\n",
      "hopfield_g 0.3\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.25, 0.15]), 'fb': array([0.15, 0.09])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.3\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [784, 500, 10]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [784, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_ = 0.99999\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([0.3, 0.22]), 'fb': np.array([np.nan, 0.07])}, {'ff' : np.array([0.25, 0.15]), 'fb': np.array([0.15, 0.09])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.07, 0.05]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [30]\n",
    "hopfield_g_list = [0.3]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "\n",
    "setting_number = 0\n",
    "for lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bc4c9b43",
   "metadata": {},
   "source": [
    "## CIFAR10 Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "34e7edf0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "3.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.648406</td>\n",
       "      <td>0.51732</td>\n",
       "      <td>0.001741</td>\n",
       "      <td>0.003437</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.624266</td>\n",
       "      <td>0.51065</td>\n",
       "      <td>0.001146</td>\n",
       "      <td>0.003666</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.648484</td>\n",
       "      <td>0.51856</td>\n",
       "      <td>0.001553</td>\n",
       "      <td>0.003349</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>0.624564</td>\n",
       "      <td>0.51066</td>\n",
       "      <td>0.001796</td>\n",
       "      <td>0.003228</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.648406  0.51732     0.001741     0.003437\n",
       "1               2  0.624266  0.51065     0.001146     0.003666\n",
       "2               3  0.648484  0.51856     0.001553     0.003349\n",
       "3               4  0.624564  0.51066     0.001796     0.003228"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_CIFAR10_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "286d6fe2",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.08, 0.04]), 'fb': array([ nan, 0.04])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 1000, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.07, 0.03]), 'fb': array([ nan, 0.05])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 1000, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.08, 0.04]), 'fb': array([ nan, 0.04])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99995\n",
      "architecture [3072, 1000, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.07, 0.03]), 'fb': array([ nan, 0.05])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99995\n",
      "architecture [3072, 1000, 10]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [int(32*32*3), 1000, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_list = [0.99999, 0.99995]\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([0.08, 0.04]), 'fb': np.array([np.nan, 0.04])}, {'ff' : np.array([0.07, 0.03]), 'fb': np.array([np.nan, 0.05])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.05]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [30]\n",
    "hopfield_g_list = [0.1]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "setting_number = 0\n",
    "for lambda_, lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lambda_list, lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ac0c6429",
   "metadata": {},
   "source": [
    "# CIFAR10 3 Layers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "51c1dbbe",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.587254</td>\n",
       "      <td>0.50968</td>\n",
       "      <td>0.003554</td>\n",
       "      <td>0.003769</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.574836</td>\n",
       "      <td>0.49911</td>\n",
       "      <td>0.061825</td>\n",
       "      <td>0.032709</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.587254  0.50968     0.003554     0.003769\n",
       "1               2  0.574836  0.49911     0.061825     0.032709"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_CIFAR10_3Layers_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "efadaf30",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.11 , 0.06 , 0.035]), 'fb': array([  nan, 0.045, 0.015])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 1000, 500, 10]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.13 , 0.07 , 0.035]), 'fb': array([  nan, 0.045, 0.012])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 1000, 500, 10]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [int(32*32*3), 1000, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_list = [0.99999]\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff': np.array([0.11, 0.06, 0.035]), 'fb': np.array([ np.nan, 0.045, 0.015])}, {'ff': np.array([0.13, 0.07, 0.035]), 'fb': np.array([ np.nan, 0.045, 0.012])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.05]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [30]\n",
    "hopfield_g_list = [0.1]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "setting_number = 0\n",
    "for lambda_, lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lambda_list, lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c361667e",
   "metadata": {},
   "source": [
    "## CIFAR100 Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "ea4be26d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(27, 7)\n",
      "3.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC_top1</th>\n",
       "      <th>Tst_ACC_top1</th>\n",
       "      <th>Trn_ACC_top5</th>\n",
       "      <th>Tst_ACC_top5</th>\n",
       "      <th>Trn_ACC_std_top1</th>\n",
       "      <th>Tst_ACC_std_top1</th>\n",
       "      <th>Trn_ACC_std_top5</th>\n",
       "      <th>Tst_ACC_std_top5</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.238840</td>\n",
       "      <td>0.190550</td>\n",
       "      <td>0.409152</td>\n",
       "      <td>0.364140</td>\n",
       "      <td>0.004513</td>\n",
       "      <td>0.003147</td>\n",
       "      <td>0.005345</td>\n",
       "      <td>0.005225</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.239074</td>\n",
       "      <td>0.190720</td>\n",
       "      <td>0.409522</td>\n",
       "      <td>0.364570</td>\n",
       "      <td>0.004011</td>\n",
       "      <td>0.001885</td>\n",
       "      <td>0.004720</td>\n",
       "      <td>0.004361</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.256129</td>\n",
       "      <td>0.200814</td>\n",
       "      <td>0.421534</td>\n",
       "      <td>0.372243</td>\n",
       "      <td>0.003463</td>\n",
       "      <td>0.001490</td>\n",
       "      <td>0.006293</td>\n",
       "      <td>0.004897</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number  Trn_ACC_top1  Tst_ACC_top1  Trn_ACC_top5  Tst_ACC_top5  \\\n",
       "0               1      0.238840      0.190550      0.409152      0.364140   \n",
       "1               2      0.239074      0.190720      0.409522      0.364570   \n",
       "2               3      0.256129      0.200814      0.421534      0.372243   \n",
       "\n",
       "   Trn_ACC_std_top1  Tst_ACC_std_top1  Trn_ACC_std_top5  Tst_ACC_std_top5  \n",
       "0          0.004513          0.003147          0.005345          0.005225  \n",
       "1          0.004011          0.001885          0.004720          0.004361  \n",
       "2          0.003463          0.001490          0.006293          0.004897  "
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_CIFAR100_V2.pkl\")\n",
    "print(df_results.shape)\n",
    "df_results['Trn_ACC_list_top1'] = df_results.apply(lambda row: np.array(row['Trn_ACC_list'])[:,0], axis = 1)\n",
    "df_results['Trn_ACC_list_top5'] = df_results.apply(lambda row: np.array(row['Trn_ACC_list'])[:,1], axis = 1)\n",
    "df_results['Tst_ACC_list_top1'] = df_results.apply(lambda row: np.array(row['Tst_ACC_list'])[:,0], axis = 1)\n",
    "df_results['Tst_ACC_list_top5'] = df_results.apply(lambda row: np.array(row['Tst_ACC_list'])[:,1], axis = 1)\n",
    "\n",
    "df_results['Trn_ACC_top1'] = df_results.apply(lambda row: row['Trn_ACC_list_top1'][-1], axis = 1)\n",
    "df_results['Trn_ACC_top5'] = df_results.apply(lambda row: row['Trn_ACC_list_top5'][-1], axis = 1)\n",
    "df_results['Tst_ACC_top1'] = df_results.apply(lambda row: row['Tst_ACC_list_top1'][-1], axis = 1)\n",
    "df_results['Tst_ACC_top5'] = df_results.apply(lambda row: row['Tst_ACC_list_top5'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC_top1', 'Tst_ACC_top1', 'Trn_ACC_top5', 'Tst_ACC_top5']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std_top1', 'Tst_ACC_std_top1', 'Trn_ACC_std_top5', 'Tst_ACC_std_top5']] = df_results[['setting_number', 'Trn_ACC_top1', 'Tst_ACC_top1', 'Trn_ACC_top5', 'Tst_ACC_top5']].groupby('setting_number').std().reset_index()[['Trn_ACC_top1', 'Tst_ACC_top1', 'Trn_ACC_top5', 'Tst_ACC_top5']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC_top1'].argmax()]['setting_number']\n",
    "print(best_setting)\n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "62050ba0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.16, 0.13, 0.08]), 'fb': array([ nan, 0.06, 0.04])}\n",
      "lr_decay_multiplier 1.0\n",
      "neural_dynamic_iterations_free 50\n",
      "neural_dynamic_iterations_nudged 20\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.06\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 2000, 1000, 100]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.16, 0.13, 0.08]), 'fb': array([ nan, 0.06, 0.04])}\n",
      "lr_decay_multiplier 1.0\n",
      "neural_dynamic_iterations_free 60\n",
      "neural_dynamic_iterations_nudged 20\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.06\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 2000, 1000, 100]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.18, 0.15, 0.09]), 'fb': array([ nan, 0.08, 0.06])}\n",
      "lr_decay_multiplier 1.0\n",
      "neural_dynamic_iterations_free 50\n",
      "neural_dynamic_iterations_nudged 20\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.06\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 2000, 1000, 100]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.18, 0.15, 0.09]), 'fb': array([ nan, 0.08, 0.06])}\n",
      "lr_decay_multiplier 1.0\n",
      "neural_dynamic_iterations_free 60\n",
      "neural_dynamic_iterations_nudged 20\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.06\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 2000, 1000, 100]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [int(32*32*3), 2000, 1000, 100]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_list = [0.99999]\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "# lr_start_list = [{'ff' : np.array([0.15, 0.06, 0.04]), 'fb': np.array([np.nan, 0.03, 0.01])}, {'ff' : np.array([0.16, 0.08, 0.05]), 'fb': np.array([np.nan, 0.04, 0.02])}]\n",
    "lr_start_list = [{'ff' : np.array([0.16, 0.13, 0.08]), 'fb': np.array([np.nan, 0.06, 0.04])}, {'ff' : np.array([0.18, 0.15, 0.09]), 'fb': np.array([np.nan, 0.08, 0.06])}]\n",
    "lr_decay_multiplier_list = [1.0]\n",
    "neural_lr_start_list = [0.06]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 20\n",
    "neural_dynamic_iterations_free_list = [50, 60]\n",
    "hopfield_g_list = [0.1]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "\n",
    "setting_number = 0\n",
    "for lambda_, lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lambda_list, lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "0f30ac38",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(20, 7)\n",
      "2.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC_top1</th>\n",
       "      <th>Tst_ACC_top1</th>\n",
       "      <th>Trn_ACC_top5</th>\n",
       "      <th>Tst_ACC_top5</th>\n",
       "      <th>Trn_ACC_std_top1</th>\n",
       "      <th>Tst_ACC_std_top1</th>\n",
       "      <th>Trn_ACC_std_top5</th>\n",
       "      <th>Tst_ACC_std_top5</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.259518</td>\n",
       "      <td>0.20199</td>\n",
       "      <td>0.428228</td>\n",
       "      <td>0.37599</td>\n",
       "      <td>0.003396</td>\n",
       "      <td>0.002035</td>\n",
       "      <td>0.004845</td>\n",
       "      <td>0.002771</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.277310</td>\n",
       "      <td>0.20841</td>\n",
       "      <td>0.435044</td>\n",
       "      <td>0.37861</td>\n",
       "      <td>0.005005</td>\n",
       "      <td>0.004277</td>\n",
       "      <td>0.009238</td>\n",
       "      <td>0.007969</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number  Trn_ACC_top1  Tst_ACC_top1  Trn_ACC_top5  Tst_ACC_top5  \\\n",
       "0               1      0.259518       0.20199      0.428228       0.37599   \n",
       "1               2      0.277310       0.20841      0.435044       0.37861   \n",
       "\n",
       "   Trn_ACC_std_top1  Tst_ACC_std_top1  Trn_ACC_std_top5  Tst_ACC_std_top5  \n",
       "0          0.003396          0.002035          0.004845          0.002771  \n",
       "1          0.005005          0.004277          0.009238          0.007969  "
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMax_CIFAR100_V3.pkl\")\n",
    "print(df_results.shape)\n",
    "df_results['Trn_ACC_list_top1'] = df_results.apply(lambda row: np.array(row['Trn_ACC_list'])[:,0], axis = 1)\n",
    "df_results['Trn_ACC_list_top5'] = df_results.apply(lambda row: np.array(row['Trn_ACC_list'])[:,1], axis = 1)\n",
    "df_results['Tst_ACC_list_top1'] = df_results.apply(lambda row: np.array(row['Tst_ACC_list'])[:,0], axis = 1)\n",
    "df_results['Tst_ACC_list_top5'] = df_results.apply(lambda row: np.array(row['Tst_ACC_list'])[:,1], axis = 1)\n",
    "\n",
    "df_results['Trn_ACC_top1'] = df_results.apply(lambda row: row['Trn_ACC_list_top1'][-1], axis = 1)\n",
    "df_results['Trn_ACC_top5'] = df_results.apply(lambda row: row['Trn_ACC_list_top5'][-1], axis = 1)\n",
    "df_results['Tst_ACC_top1'] = df_results.apply(lambda row: row['Tst_ACC_list_top1'][-1], axis = 1)\n",
    "df_results['Tst_ACC_top5'] = df_results.apply(lambda row: row['Tst_ACC_list_top5'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC_top1', 'Tst_ACC_top1', 'Trn_ACC_top5', 'Tst_ACC_top5']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std_top1', 'Tst_ACC_std_top1', 'Trn_ACC_std_top5', 'Tst_ACC_std_top5']] = df_results[['setting_number', 'Trn_ACC_top1', 'Tst_ACC_top1', 'Trn_ACC_top5', 'Tst_ACC_top5']].groupby('setting_number').std().reset_index()[['Trn_ACC_top1', 'Tst_ACC_top1', 'Trn_ACC_top5', 'Tst_ACC_top5']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC_top1'].argmax()]['setting_number']\n",
    "print(best_setting)\n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "7542f2c2",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.16, 0.13, 0.08]), 'fb': array([ nan, 0.06, 0.04])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 50\n",
      "neural_dynamic_iterations_nudged 20\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.06\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 2000, 1000, 100]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.18, 0.15, 0.09]), 'fb': array([ nan, 0.08, 0.06])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 50\n",
      "neural_dynamic_iterations_nudged 20\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.06\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "architecture [3072, 2000, 1000, 100]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [int(32*32*3), 2000, 1000, 100]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_list = [0.99999]\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "# lr_start_list = [{'ff' : np.array([0.15, 0.06, 0.04]), 'fb': np.array([np.nan, 0.03, 0.01])}, {'ff' : np.array([0.16, 0.08, 0.05]), 'fb': np.array([np.nan, 0.04, 0.02])}]\n",
    "lr_start_list = [{'ff' : np.array([0.16, 0.13, 0.08]), 'fb': np.array([np.nan, 0.06, 0.04])}, {'ff' : np.array([0.18, 0.15, 0.09]), 'fb': np.array([np.nan, 0.08, 0.06])}]\n",
    "lr_decay_multiplier_list = [0.99]\n",
    "neural_lr_start_list = [0.06]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 20\n",
    "neural_dynamic_iterations_free_list = [50]\n",
    "hopfield_g_list = [0.1]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "\n",
    "setting_number = 0\n",
    "for lambda_, lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lambda_list, lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"architecture\" : architecture,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f0b36a44",
   "metadata": {},
   "source": [
    "# CorInfoMax-Sparse"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ee30bd76",
   "metadata": {},
   "source": [
    "## MNIST Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "ad800e86",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "3.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.897933</td>\n",
       "      <td>0.88891</td>\n",
       "      <td>0.280817</td>\n",
       "      <td>0.277899</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.986342</td>\n",
       "      <td>0.97634</td>\n",
       "      <td>0.001277</td>\n",
       "      <td>0.001212</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.986983</td>\n",
       "      <td>0.97711</td>\n",
       "      <td>0.000604</td>\n",
       "      <td>0.000962</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>0.986957</td>\n",
       "      <td>0.97724</td>\n",
       "      <td>0.000457</td>\n",
       "      <td>0.000833</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.897933  0.88891     0.280817     0.277899\n",
       "1               2  0.986342  0.97634     0.001277     0.001212\n",
       "2               3  0.986983  0.97711     0.000604     0.000962\n",
       "3               4  0.986957  0.97724     0.000457     0.000833"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMaxSparse_MNIST_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "61747d94",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 5\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 6\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 7\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.5\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 8\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([1. , 0.7]), 'fb': array([0.15, 0.12])}\n",
      "lr_decay_multiplier 0.99\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 4\n",
      "neural_lr_rule constant\n",
      "neural_lr 0.05\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [784, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_ = 0.99999\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([1.0, 0.7]), 'fb': np.array([0.15, 0.12])}]\n",
    "lr_decay_multiplier_list = [0.95, 0.99]\n",
    "neural_lr_start_list = [0.05]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\", \"constant\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 4\n",
    "neural_dynamic_iterations_free_list = [20]\n",
    "hopfield_g_list = [0.5, 0.2]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "STlambda_lr_list = [1e-6, 0.01]\n",
    "sparse_layers = [1, 2]\n",
    "\n",
    "setting_number = 0\n",
    "for lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"STlambda_lr_list\": STlambda_lr_list, \n",
    "                        \"architecture\" : architecture, \"sparse_layers\": sparse_layers,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "14831e31",
   "metadata": {},
   "source": [
    "## Fashion MNIST Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "99bb78c4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.899432</td>\n",
       "      <td>0.87177</td>\n",
       "      <td>0.029649</td>\n",
       "      <td>0.029271</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.908608</td>\n",
       "      <td>0.88091</td>\n",
       "      <td>0.001108</td>\n",
       "      <td>0.000814</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.899432  0.87177     0.029649     0.029271\n",
       "1               2  0.908608  0.88091     0.001108     0.000814"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMaxSparse_FashionMNIST_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "28c70785",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.35, 0.23]), 'fb': array([ nan, 0.06])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.045\n",
      "hopfield_g 0.3\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.35, 0.23]), 'fb': array([ nan, 0.06])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.045\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [784, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_ = 0.99999\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([0.35, 0.23]), 'fb': np.array([np.nan, 0.06])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.045]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [20]\n",
    "hopfield_g_list = [0.3, 0.2]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "STlambda_lr_list = [1e-6, 0.01]\n",
    "sparse_layers = [1, 2]\n",
    "\n",
    "setting_number = 0\n",
    "for lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"STlambda_lr_list\": STlambda_lr_list, \n",
    "                        \"architecture\" : architecture, \"sparse_layers\": sparse_layers,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "d52ff7b5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.900733</td>\n",
       "      <td>0.87233</td>\n",
       "      <td>0.029861</td>\n",
       "      <td>0.029585</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.900592</td>\n",
       "      <td>0.87257</td>\n",
       "      <td>0.029699</td>\n",
       "      <td>0.029517</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.900733  0.87233     0.029861     0.029585\n",
       "1               2  0.900592  0.87257     0.029699     0.029517"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMaxSparse_FashionMNIST_V3.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "b4094829",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.35, 0.23]), 'fb': array([ nan, 0.06])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.045\n",
      "hopfield_g 0.3\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.35, 0.23]), 'fb': array([ nan, 0.06])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 20\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.045\n",
      "hopfield_g 0.2\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-06, 0.01]\n",
      "architecture [784, 500, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [784, 500, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_ = 0.99999\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff' : np.array([0.35, 0.23]), 'fb': np.array([np.nan, 0.06])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.045]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [20]\n",
    "hopfield_g_list = [0.3, 0.2]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "STlambda_lr_list = [1e-6, 0.01]\n",
    "sparse_layers = [1, 2]\n",
    "\n",
    "setting_number = 0\n",
    "for lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"STlambda_lr_list\": STlambda_lr_list, \n",
    "                        \"architecture\" : architecture, \"sparse_layers\": sparse_layers,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "50436a3d",
   "metadata": {},
   "source": [
    "## CIFAR10 Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "48f51077",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2.0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>setting_number</th>\n",
       "      <th>Trn_ACC</th>\n",
       "      <th>Tst_ACC</th>\n",
       "      <th>Trn_ACC_std</th>\n",
       "      <th>Tst_ACC_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>0.630052</td>\n",
       "      <td>0.51047</td>\n",
       "      <td>0.004824</td>\n",
       "      <td>0.004038</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>0.637194</td>\n",
       "      <td>0.51188</td>\n",
       "      <td>0.005634</td>\n",
       "      <td>0.003585</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>0.630030</td>\n",
       "      <td>0.51062</td>\n",
       "      <td>0.005393</td>\n",
       "      <td>0.003209</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>0.637156</td>\n",
       "      <td>0.51106</td>\n",
       "      <td>0.005341</td>\n",
       "      <td>0.003796</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   setting_number   Trn_ACC  Tst_ACC  Trn_ACC_std  Tst_ACC_std\n",
       "0               1  0.630052  0.51047     0.004824     0.004038\n",
       "1               2  0.637194  0.51188     0.005634     0.003585\n",
       "2               3  0.630030  0.51062     0.005393     0.003209\n",
       "3               4  0.637156  0.51106     0.005341     0.003796"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_results = pd.read_pickle(r\"../Results/simulation_results_CorInfoMaxSparse_CIFAR10_V1.pkl\")\n",
    "\n",
    "df_results['Trn_ACC'] = df_results.apply(lambda row: row['Trn_ACC_list'][-1], axis = 1)\n",
    "df_results['Tst_ACC'] = df_results.apply(lambda row: row['Tst_ACC_list'][-1], axis = 1)\n",
    "\n",
    "df_setting = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').mean().reset_index()\n",
    "df_setting[['Trn_ACC_std', 'Tst_ACC_std']] = df_results[['setting_number', 'Trn_ACC', 'Tst_ACC']].groupby('setting_number').std().reset_index()[['Trn_ACC', 'Tst_ACC']]\n",
    "\n",
    "best_setting = df_setting.iloc[df_setting['Trn_ACC'].argmax()]['setting_number']\n",
    "print(best_setting) \n",
    "\n",
    "df_setting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "5817b39a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Setting Number : 1\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.09, 0.07]), 'fb': array([  nan, 0.045])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.025\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-05, 0.01]\n",
      "architecture [3072, 1000, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 2\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.095, 0.075]), 'fb': array([ nan, 0.05])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.025\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99999\n",
      "STlambda_lr_list [1e-05, 0.01]\n",
      "architecture [3072, 1000, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 3\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.09, 0.07]), 'fb': array([  nan, 0.045])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.025\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99995\n",
      "STlambda_lr_list [1e-05, 0.01]\n",
      "architecture [3072, 1000, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n",
      "\n",
      "Setting Number : 4\n",
      "Corresponding Hyperparameters:\n",
      "\n",
      "lr_start {'ff': array([0.095, 0.075]), 'fb': array([ nan, 0.05])}\n",
      "lr_decay_multiplier 0.95\n",
      "neural_dynamic_iterations_free 30\n",
      "neural_dynamic_iterations_nudged 10\n",
      "neural_lr_rule divide_by_slow_loop_index\n",
      "neural_lr 0.025\n",
      "hopfield_g 0.1\n",
      "epsilon 0.15\n",
      "lambda 0.99995\n",
      "STlambda_lr_list [1e-05, 0.01]\n",
      "architecture [3072, 1000, 10]\n",
      "sparse_layers [1, 2]\n",
      "three_phase False\n"
     ]
    }
   ],
   "source": [
    "architecture = [int(32*32*3), 1000, 10]\n",
    "############# HYPERPARAMS GRID SEARCH LISTS #########################\n",
    "beta = 1\n",
    "lambda_list = [0.99999, 0.99995]\n",
    "epsilon = 0.15\n",
    "one_over_epsilon = 1 / epsilon\n",
    "lr_start_list = [{'ff': np.array([0.09, 0.07]), 'fb': np.array([ np.nan, 0.045])}, {'ff': np.array([0.095, 0.075]), 'fb': np.array([ np.nan, 0.05])}]\n",
    "lr_decay_multiplier_list = [0.95]\n",
    "neural_lr_start_list = [0.025]\n",
    "neural_lr_stop = 0.001\n",
    "neural_lr_rule_list = [\"divide_by_slow_loop_index\"]\n",
    "neural_lr_decay_multiplier = 0.01\n",
    "neural_dynamic_iterations_nudged = 10\n",
    "neural_dynamic_iterations_free_list = [30]\n",
    "hopfield_g_list = [0.1]\n",
    "use_random_sign_beta = True\n",
    "use_three_phase_list = [False]\n",
    "STlambda_lr_list = [1*1e-5, 0.01]\n",
    "sparse_layers = [1, 2]\n",
    "\n",
    "setting_number = 0\n",
    "for lambda_, lr_start, lr_decay_multiplier, neural_lr_start, neural_lr_rule, neural_dynamic_iterations_free, hopfield_g, use_three_phase in product(lambda_list, lr_start_list, lr_decay_multiplier_list, neural_lr_start_list, neural_lr_rule_list, neural_dynamic_iterations_free_list, hopfield_g_list, use_three_phase_list):\n",
    "    setting_number += 1\n",
    "    hyperparams_dict = {\"lr_start\" : lr_start, \"lr_decay_multiplier\" : lr_decay_multiplier,\n",
    "                        \"neural_dynamic_iterations_free\" : neural_dynamic_iterations_free,\n",
    "                        \"neural_dynamic_iterations_nudged\" : neural_dynamic_iterations_nudged, \n",
    "                        \"neural_lr_rule\" : neural_lr_rule, \"neural_lr\" : neural_lr_start, \n",
    "                        \"hopfield_g\": hopfield_g, \"epsilon\" : epsilon, \"lambda\" : lambda_,\n",
    "                        \"STlambda_lr_list\": STlambda_lr_list, \n",
    "                        \"architecture\" : architecture, \"sparse_layers\": sparse_layers,\n",
    "                        \"three_phase\" : use_three_phase}\n",
    "    print(\"\\nSetting Number : {}\".format(setting_number))\n",
    "    print(\"Corresponding Hyperparameters:\\n\")\n",
    "    for x in hyperparams_dict:\n",
    "        print(x, hyperparams_dict[x])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "863f19c7",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "02b4b3a3",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
