{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "sesdLmc9PWcO"
   },
   "source": [
    "# Detector F1-Scores\n",
    "\n",
    "| Classifier     | AG_News | IMDB (normalized) | SST2 | Yelp_Polarity (normalized) |\n",
    "|----------------|---------|-------------------|------|----------------------------|\n",
    "| Neural Network | 0.90    | 0.96              | 0.76 | 0.93                       |\n",
    "| Random Forest  | 0.91    | 0.87              | 0.77 | 0.84                       |\n",
    "| SVM            | 0.90    | 0.90              | 0.74 | 0.89                       |\n",
    "| Linear SVM     | 0.67    | 0.42              | 0.65 | 0.26                       |"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "0gWZiPIqJqRQ"
   },
   "outputs": [],
   "source": [
    "######### CHANGE DATASET AND NORMALIZATION MODE HERE ##########\n",
    "mode = 'normalized'\n",
    "dset = 'ag_news'\n",
    "\n",
    "assert mode in ['normalized', 'normalized_pred', 'unnormalized', 'unnormalized_pred'], 'Wrong mode'\n",
    "assert dset in ['imdb', 'ag_news', 'yelp_polarity', 'sst2']\n",
    "\n",
    "use_norm = False\n",
    "use_pred = False\n",
    "\n",
    "if 'pred' in mode: # Only works for AG_News so far\n",
    "  use_pred = True\n",
    "\n",
    "if mode.startswith('normalized'):\n",
    "  use_norm = True"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "2w3VlLs3v0zX"
   },
   "source": [
    "## Reproducability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "SrY2aGs5vzzU"
   },
   "outputs": [],
   "source": [
    "# From https://keras.io/getting_started/faq/\n",
    "\n",
    "import numpy as np\n",
    "import tensorflow as tf\n",
    "import random\n",
    "import os\n",
    "\n",
    "seed = 42\n",
    "\n",
    "# The below is necessary for starting Numpy generated random numbers\n",
    "# in a well-defined initial state.\n",
    "np.random.seed(seed)\n",
    "\n",
    "# The below is necessary for starting core Python generated random numbers\n",
    "# in a well-defined state.\n",
    "random.seed(seed)\n",
    "\n",
    "# The below set_seed() will make random number generation\n",
    "# in the TensorFlow backend fhave a well-defined initial state.\n",
    "tf.random.set_seed(seed)\n",
    "\n",
    "# ENV variables\n",
    "# GPUs need to be disabled since they produce non-deterministic results\n",
    "os.environ['CUDA_VISIBLE_DEVICES']= '0'\n",
    "os.environ['PYTHONHASHSEED'] = str(seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "A6QiXcg8aR5j"
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "from sklearn import metrics\n",
    "from sklearn.naive_bayes import GaussianNB, MultinomialNB, BernoulliNB\n",
    "from sklearn.linear_model import LogisticRegression, SGDClassifier\n",
    "from sklearn.svm import SVC, LinearSVC, NuSVC\n",
    "from sklearn.metrics import accuracy_score, classification_report\n",
    "from joblib import dump, load \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "qD4qrtqAaR58",
    "outputId": "11affc4c-0b01-4548-b7ac-d093a3ee1e1d"
   },
   "outputs": [],
   "source": [
    "from sklearn.model_selection import train_test_split\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "\n",
    "\n",
    "if dset == 'ag_news':\n",
    "  data_x_path = 'data/AG_News/BiLSTM_AGNews_shapvals_100000.npy'\n",
    "  data_y_path = 'data/AG_News/BiLSTM_AGNews_shapvals_100000_labels.npy'\n",
    "elif dset == 'imdb':\n",
    "  data_x_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580.npy'\n",
    "  data_y_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580_labels.npy'\n",
    "elif dset == 'yelp_polarity':\n",
    "  data_x_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940.npy'\n",
    "  data_y_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940_labels.npy'\n",
    "elif dset == 'sst2':\n",
    "  data_x_path = 'data/SST2/BiLSTM_SST2_shapvals_3162.npy'\n",
    "  data_y_path = 'data/SST2/BiLSTM_SST2_shapvals_3162_labels.npy'\n",
    "else:\n",
    "  raise NotImplementedError\n",
    "\n",
    "'''if dset == 'ag_news':\n",
    "  data_x_path = 'data/AG_News_shapvals.npy'\n",
    "  data_y_path = 'data/AG_News_labels.npy'\n",
    "elif dset == 'imdb':\n",
    "  data_x_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580.npy'\n",
    "  data_y_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580_labels.npy'\n",
    "elif dset == 'yelp_polarity':\n",
    "  data_x_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940.npy'\n",
    "  data_y_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940_labels.npy'\n",
    "elif dset == 'sst2':\n",
    "  data_x_path = 'data/SST2/BiLSTM_SST2_shapvals_3162.npy'\n",
    "  data_y_path = 'data/SST2/BiLSTM_SST2_shapvals_3162_labels.npy'\n",
    "else:\n",
    "  raise NotImplementedError'''\n",
    "\n",
    "\n",
    "data_x = np.load(data_x_path)\n",
    "data_y = np.load(data_y_path)\n",
    "\n",
    "# Augment by class prediction\n",
    "# Only works for AG_News so far\n",
    "if use_pred and dset == 'ag_news':\n",
    "  org_preds = np.load('BiLSTM_AGNews_org_preds.npy')\n",
    "  adv_preds = np.load('BiLSTM_AGNews_adv_preds.npy')\n",
    "  preds = np.concatenate((org_preds, adv_preds))\n",
    "  preds = np.expand_dims(preds, axis=1)\n",
    "  preds = preds.astype('float64')\n",
    "  data_x = np.append(data_x, preds, axis=1)\n",
    "  print('Using SHAP values + predictions')\n",
    "else:\n",
    "  use_pred = False\n",
    "  print('Using SHAP values only')\n",
    "\n",
    "x_train, x_test, y_train, y_test = train_test_split(data_x, data_y, random_state=0, shuffle=True, train_size=0.8)\n",
    "\n",
    "print(f'Using {dset}')\n",
    "# Normalize\n",
    "if use_norm:\n",
    "  scaler = StandardScaler()\n",
    "  x_train = scaler.fit_transform(x_train)\n",
    "  x_test = scaler.transform(x_test)\n",
    "  print('Using normalized data')\n",
    "else:\n",
    "  print('Using unnormalized data')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "c0e3eASOeD2F"
   },
   "outputs": [],
   "source": [
    "def draw_confusion_matrix(y_test, preds, classifier_name=''):\n",
    "  score = accuracy_score(y_test, preds)\n",
    "  cm = metrics.confusion_matrix(y_test, preds)\n",
    "\n",
    "  plt.figure(figsize=(9,9))\n",
    "  sns.heatmap(cm, annot=True, fmt=\".0f\", linewidths=.5, square = True, cmap = 'OrRd', xticklabels=['Original', 'Adversial'], yticklabels=['Original', 'Adversial'])\n",
    "  plt.ylabel('Actual label')\n",
    "  plt.xlabel('Predicted label')\n",
    "  all_sample_title = '{0}\\n Accuracy Score: {1}'.format(classifier_name, score)\n",
    "  plt.title(all_sample_title, size = 15)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "QBC5hVZleWAW"
   },
   "source": [
    "## Multilayer Neural Network"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "qxpZBrgcaR6R"
   },
   "outputs": [],
   "source": [
    "import tensorflow as tf\n",
    "from tensorflow.keras.initializers import glorot_uniform\n",
    "from tensorflow.keras.regularizers import l1\n",
    "\n",
    "if dset == 'ag_news':\n",
    "  input_shape = 400\n",
    "elif dset == 'imdb':\n",
    "  input_shape = 200\n",
    "elif dset == 'yelp_polarity':\n",
    "  input_shape = 200\n",
    "elif dset == 'sst2':\n",
    "  input_shape = 200\n",
    "\n",
    "if use_pred:\n",
    "  input_shape += 1\n",
    "\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(400, input_shape=(input_shape,), activation='relu', kernel_regularizer=l1(0.00001), kernel_initializer=glorot_uniform(seed=42)),\n",
    "    tf.keras.layers.Dropout(0.5, seed=42),\n",
    "    tf.keras.layers.Dense(400, activation='relu', kernel_regularizer=l1(0.00001), kernel_initializer=glorot_uniform(seed=42)),\n",
    "    tf.keras.layers.Dense(1, activation='sigmoid', kernel_initializer=glorot_uniform(seed=seed))\n",
    "])\n",
    "\n",
    "model.compile(optimizer='adam',\n",
    "              loss='binary_crossentropy',\n",
    "              metrics=['accuracy'])\n",
    "\n",
    "model.fit(x_train, y_train, epochs=10)\n",
    "model.evaluate(x_test, y_test)\n",
    "\n",
    "preds = model.predict(x_test)\n",
    "preds = preds.flatten()\n",
    "preds[preds < 0.5] = 0\n",
    "preds[preds >= 0.5] = 1\n",
    "draw_confusion_matrix(y_test, preds, f'Multilayer Neural Network {dset}')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "G9q0R5VReRJV"
   },
   "source": [
    "## Random Forest"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "pHv2_36iaR6F"
   },
   "outputs": [],
   "source": [
    "from sklearn.ensemble import RandomForestClassifier\n",
    "randomF = RandomForestClassifier(random_state=42)\n",
    "randomF.fit(x_train,y_train)\n",
    "preds = randomF.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'Random Forest')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "qUIf1br_dI0d"
   },
   "source": [
    "## Support Vector Machine (SVM)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "E1qT8ztZclFU",
    "outputId": "4f472016-57e7-4ab9-8238-2f7e6d23c34c"
   },
   "outputs": [],
   "source": [
    "from sklearn.svm import SVC\n",
    "SVC = SVC(random_state=42)\n",
    "SVC.fit(x_train,y_train)\n",
    "preds = SVC.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'SVM')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "a1h6k423dQ7n"
   },
   "source": [
    "## Linear Support Vector Machine (Linear SVM)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "GPiVQfdAdrwJ",
    "outputId": "2b33e637-ddc4-49d7-e1bf-d757cb7653d2"
   },
   "outputs": [],
   "source": [
    "from sklearn.svm import LinearSVC\n",
    "LSVC = LinearSVC(random_state=42)\n",
    "LSVC.fit(x_train,y_train)\n",
    "preds = LSVC.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'Linear SVM')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Extra classifiers"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "uRUMgisCbgs8"
   },
   "source": [
    "## Gaussian Naive Bayes\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 685
    },
    "id": "qsMizKHabEq4",
    "outputId": "25440630-ad1a-4fe7-fb07-160f07418639"
   },
   "outputs": [],
   "source": [
    "from sklearn.naive_bayes import GaussianNB\n",
    "gnb = GaussianNB()\n",
    "gnb.fit(x_train, y_train)\n",
    "preds = gnb.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'Gaussian Naive Bayes')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "qOO4KyxCcOID"
   },
   "source": [
    "## Bernoulli Naive Bayes\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "FSB4QIbDbE_f",
    "outputId": "68c5517c-655f-4d09-cca0-201690e60f22"
   },
   "outputs": [],
   "source": [
    "from sklearn.naive_bayes import BernoulliNB\n",
    "BNB = BernoulliNB()\n",
    "BNB.fit(x_train,y_train)\n",
    "preds = BNB.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'Bernoulli Naives Bayes')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "T8llR4x3cbPD"
   },
   "source": [
    "## Logistic Regression"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "ZF0s_pd0bFEW",
    "outputId": "94573096-2bfc-4888-8cb5-6b06ee68a983"
   },
   "outputs": [],
   "source": [
    "from sklearn.linear_model import LogisticRegression\n",
    "LR = LogisticRegression(random_state=42)\n",
    "LR.fit(x_train,y_train)\n",
    "preds = LR.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'Logistic Regression')\n",
    "print(classification_report(y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "I31EqMytdsGm"
   },
   "source": [
    "## Nu-Support Vector Machine"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "-ke0vAwSdsSp"
   },
   "outputs": [],
   "source": [
    "from sklearn.svm import NuSVC\n",
    "NSVC = NuSVC(random_state=42)\n",
    "NSVC.fit(x_train,y_train)\n",
    "preds = NSVC.predict(x_test)\n",
    "draw_confusion_matrix(y_test, preds, 'Nu-Support Vector Machine')\n",
    "print(classification_report(y_test, preds))"
   ]
  }
 ],
 "metadata": {
  "colab": {
   "collapsed_sections": [],
   "name": "SHAP_Detector.ipynb",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
