{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Contrasting performance to multinomial logistic regression models\n",
    "\n",
    "> Last edit: August 1, 2022.\n",
    "\n",
    "----"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import pickle\n",
    "import sys\n",
    "sys.path.append('../')\n",
    "#from TrainModels import models\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "from torch.utils.data import Dataset\n",
    "from torch.utils.data import DataLoader\n",
    "import numpy as np\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Display table from Appendix J\n",
    "\n",
    "----"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "STORED_ERRORS_PATH = '/SavedErrors'\n",
    "\n",
    "# Load linear errors\n",
    "linear_core_MAE = torch.load(f'{STORED_ERRORS_PATH}MAEs_multinomial_logit_banzhaf')\n",
    "linear_shap_MAE = torch.load(f'{STORED_ERRORS_PATH}MAEs_multinomial_logit_shapley')\n",
    "linear_banz_MAE = torch.load(f'{STORED_ERRORS_PATH}MAEs_multinomial_logit_banzhaf')\n",
    "\n",
    "# Load neural network errors\n",
    "neural_shap = pd.read_csv(f'{STORED_ERRORS_PATH}df_shap')\n",
    "neural_banz = pd.read_csv(f'{STORED_ERRORS_PATH}df_banz')\n",
    "neural_core = pd.read_csv(f'{STORED_ERRORS_PATH}df_core')\n",
    "\n",
    "df_contrast_perf = pd.DataFrame({\n",
    "    'N'                     : np.arange(4, 21),\n",
    "    'Linear Core'           : linear_core_MAE.detach().numpy(),\n",
    "    'Neural net Core'       : neural_core.groupby('n_players')['MAE_payoffs'].mean().values,\n",
    "    'Linear Shapley'        : linear_shap_MAE.detach().numpy(),\n",
    "    'Neural net Shapley'    : neural_shap.groupby('n_players')['MAE_payoffs'].mean().values,\n",
    "    'Linear Banzhaf'        : linear_banz_MAE.detach().numpy(),\n",
    "    'Neural net Banzhaf'    : neural_banz.groupby('n_players')['MAE_payoffs'].mean().values,\n",
    "})\n",
    "\n",
    "table = df_contrast_perf.set_index('N')\n",
    "\n",
    "table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [],
   "source": [
    "# pd.options.display.float_format = \"{:,.3f}\".format\n",
    "\n",
    "# table = df_contrast_perf.set_index('N')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "N\n",
       "4    41.030\n",
       "5    57.526\n",
       "6    70.443\n",
       "7    77.524\n",
       "8    76.018\n",
       "9    76.619\n",
       "10   86.143\n",
       "11   77.626\n",
       "12   89.802\n",
       "13   88.542\n",
       "14   72.449\n",
       "15   63.578\n",
       "16   88.843\n",
       "17   78.185\n",
       "18   58.237\n",
       "19   87.361\n",
       "20   75.233\n",
       "dtype: float64"
      ]
     },
     "execution_count": 87,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(table['Neural net Banzhaf'] - table['Linear Banzhaf']) / table['Linear Banzhaf'] * -100"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "N\n",
       "4    48.628\n",
       "5    58.254\n",
       "6    68.083\n",
       "7    69.255\n",
       "8    76.785\n",
       "9    83.170\n",
       "10   83.093\n",
       "11   86.225\n",
       "12   88.302\n",
       "13   73.949\n",
       "14   89.240\n",
       "15   87.853\n",
       "16   87.088\n",
       "17   85.419\n",
       "18   76.665\n",
       "19   72.952\n",
       "20   74.207\n",
       "dtype: float64"
      ]
     },
     "execution_count": 85,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(table['Neural net Shapley'] - table['Linear Shapley']) / table['Linear Shapley'] * -100"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "N\n",
       "4    58.216\n",
       "5    47.108\n",
       "6    52.687\n",
       "7    62.327\n",
       "8    72.436\n",
       "9    77.964\n",
       "10   82.125\n",
       "11   86.360\n",
       "12   85.997\n",
       "13   90.563\n",
       "14   91.008\n",
       "15   91.541\n",
       "16   94.143\n",
       "17   93.613\n",
       "18   90.471\n",
       "19   94.550\n",
       "20   93.702\n",
       "dtype: float64"
      ]
     },
     "execution_count": 86,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(table['Neural net Core'] - table['Linear Core']) / table['Linear Core'] * -100"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Training script\n",
    "\n",
    "---"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# TRAIN_DATA_PATH = 'WeightedVotingGames/Data/TrainDataFixed/'\n",
    "# TEST_DATA_PATH = 'WeightedVotingGames/Data/TestDataFixed/'\n",
    "\n",
    "# solution_concept = 'Y_shap'\n",
    "# MIN_PLAY_SIZE = 4\n",
    "# MAX_PLAY_SIZE = 21\n",
    "# errors = torch.zeros(MAX_PLAY_SIZE - MIN_PLAY_SIZE)\n",
    "\n",
    "# iter = 0\n",
    "\n",
    "# for NUM_PLAY in range(MIN_PLAY_SIZE, MAX_PLAY_SIZE):\n",
    "\n",
    "#     print(f'Training linear model with {NUM_PLAY} players')\n",
    "\n",
    "#     with open(f'{TRAIN_DATA_PATH}{NUM_PLAY}players_train.pickle', 'rb') as handle:\n",
    "#         train_dict = pickle.load(handle)\n",
    "\n",
    "#     with open(f'{TEST_DATA_PATH}{NUM_PLAY}players_test_mpi_in_sample.pickle', 'rb') as handle:\n",
    "#         test_dict = pickle.load(handle)\n",
    "\n",
    "#     class WVGDataset(Dataset):\n",
    "#         def __init__(self, X, Y):\n",
    "#             self.X = X\n",
    "#             self.Y = Y\n",
    "#         def __len__(self):\n",
    "#             return self.X.shape[0]\n",
    "#         def __getitem__(self, index):\n",
    "#             return (\n",
    "#                 self.X[index, :].float(),\n",
    "#                 self.Y[index, :].float()\n",
    "#             )\n",
    "\n",
    "#     train_set = WVGDataset(\n",
    "#         test_dict['X'],\n",
    "#         test_dict[solution_concept]\n",
    "#     )\n",
    "\n",
    "#     test_set = WVGDataset(\n",
    "#         test_dict['X'],\n",
    "#         test_dict[solution_concept]\n",
    "#     )\n",
    "\n",
    "#     batch_size = 100\n",
    "#     num_epochs = 50\n",
    "\n",
    "#     train_loader = DataLoader(\n",
    "#         train_set,\n",
    "#         batch_size=batch_size,\n",
    "#     )\n",
    "\n",
    "#     test_loader = DataLoader(\n",
    "#         test_set,\n",
    "#         batch_size=batch_size,\n",
    "#     )\n",
    "\n",
    "#     # Create linear model\n",
    "#     linear_model = models.MultinomialRegression(\n",
    "#         input_size = NUM_PLAY,\n",
    "#         output_size = NUM_PLAY,\n",
    "#     )\n",
    "\n",
    "#     # Set loss function and optimizer\n",
    "#     learning_rate = 1e-3\n",
    "#     optimizer = torch.optim.SGD(linear_model.parameters(), lr=learning_rate)  \n",
    "#     loss_fn = nn.MSELoss()\n",
    "\n",
    "#     ''' Train '''\n",
    "#     for epoch in range(num_epochs):\n",
    "#         for i, (x, y) in enumerate(train_loader):\n",
    "\n",
    "#             optimizer.zero_grad()\n",
    "\n",
    "#             # Forward pass to get output/logits\n",
    "#             y_pred = linear_model(x)\n",
    "\n",
    "#             # Calculate Loss: softmax --> cross entropy loss\n",
    "#             loss = loss_fn(y_pred, y)\n",
    "\n",
    "#             # Getting gradients w.r.t. parameters\n",
    "#             loss.backward()\n",
    "\n",
    "#             # Updating parameters\n",
    "#             optimizer.step()\n",
    "\n",
    "#     ''' Test ''' \n",
    "#     predictions = torch.zeros((num_epochs, batch_size, NUM_PLAY))\n",
    "#     actual = torch.zeros((num_epochs, batch_size, NUM_PLAY))\n",
    "\n",
    "#     print(f'Evaluating linear model with {NUM_PLAY} players \\n')\n",
    "\n",
    "#     for epoch in range(num_epochs):\n",
    "#         linear_model.eval()\n",
    "#         for i, (x, y) in enumerate(test_loader):\n",
    "\n",
    "#             # Forward pass to get output/logits\n",
    "#             y_pred = linear_model(x)\n",
    "#             predictions[epoch, :, :] = y_pred\n",
    "#             actual[epoch, :, :] = y\n",
    "\n",
    "#             # Calculate Loss: softmax --> cross entropy loss\n",
    "#             loss = loss_fn(y_pred, y)\n",
    "\n",
    "#             # Getting gradients w.r.t. parameters\n",
    "#             loss.backward()\n",
    "\n",
    "#             # Updating parameters\n",
    "#             optimizer.step()\n",
    "    \n",
    "#     errors[iter] = torch.absolute(predictions - actual).mean()\n",
    "\n",
    "#     iter+=1\n",
    "#torch.save(errors, f'MAEs_multinomial_logit_{solution_concept}')a"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3.9.7 ('rebuttal')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "8b4c61b0c0dfa50a12dd4948992e6e1a04659874706c6edcf781c314bdb1c462"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
