{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "0gWZiPIqJqRQ"
   },
   "outputs": [],
   "source": [
    "base_dset = 'sst2'\n",
    "\n",
    "test1_dset = 'imdb'\n",
    "test2_dset = 'yelp_polarity'\n",
    "test3_dset = 'sst2'\n",
    "\n",
    "assert base_dset in ['imdb', 'yelp_polarity', 'sst2']"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "2w3VlLs3v0zX"
   },
   "source": [
    "# Reproducability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "SrY2aGs5vzzU"
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import tensorflow as tf\n",
    "import random\n",
    "import os\n",
    "\n",
    "seed = 42\n",
    "\n",
    "# The below is necessary for starting Numpy generated random numbers\n",
    "# in a well-defined initial state.\n",
    "np.random.seed(seed)\n",
    "\n",
    "# The below is necessary for starting core Python generated random numbers\n",
    "# in a well-defined state.\n",
    "random.seed(seed)\n",
    "\n",
    "# The below set_seed() will make random number generation\n",
    "# in the TensorFlow backend have a well-defined initial state.\n",
    "tf.random.set_seed(seed)\n",
    "\n",
    "# ENV variables\n",
    "# GPUs need to be disabled since they produce non-deterministic results\n",
    "os.environ['CUDA_VISIBLE_DEVICES']= '0'\n",
    "os.environ['PYTHONHASHSEED'] = str(seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "A6QiXcg8aR5j"
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "from sklearn import metrics\n",
    "from sklearn.naive_bayes import GaussianNB, MultinomialNB, BernoulliNB\n",
    "from sklearn.linear_model import LogisticRegression, SGDClassifier\n",
    "from sklearn.svm import SVC, LinearSVC, NuSVC\n",
    "from sklearn.metrics import accuracy_score, classification_report\n",
    "from joblib import dump, load \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "C1r8gjH9laNI"
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "#test = np.load('/content/BiLSTM_AGNews_shapvals_100000_labels.npy')\n",
    "#print(test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "qD4qrtqAaR58"
   },
   "outputs": [],
   "source": [
    "from sklearn.model_selection import train_test_split\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "\n",
    "if base_dset == 'imdb':\n",
    "  data_x_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580.npy'\n",
    "  data_y_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580_labels.npy'\n",
    "elif base_dset == 'yelp_polarity':\n",
    "  data_x_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940.npy'\n",
    "  data_y_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940_labels.npy'\n",
    "elif base_dset == 'sst2':\n",
    "  data_x_path = 'data/SST2/BiLSTM_SST2_shapvals_3162.npy'\n",
    "  data_y_path = 'data/SST2/BiLSTM_SST2_shapvals_3162_labels.npy'\n",
    "else:\n",
    "  raise NotImplementedError\n",
    "\n",
    "data_x = np.load(data_x_path)\n",
    "data_y = np.load(data_y_path)\n",
    "\n",
    "\n",
    "test1_data_x_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580.npy'\n",
    "test1_data_y_path = 'data/IMDB/BiLSTM_IMDB_shapvals_3580_labels.npy'\n",
    "\n",
    "test2_data_x_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940.npy'\n",
    "test2_data_y_path = 'data/Yelp_Polarity/BiLSTM_Yelp_Polarity_shapvals_940_labels.npy'\n",
    "\n",
    "test3_data_x_path = 'data/SST2/BiLSTM_SST2_shapvals_3162.npy'\n",
    "test3_data_y_path = 'data/SST2/BiLSTM_SST2_shapvals_3162_labels.npy'\n",
    "\n",
    "\n",
    "test1_data_x = np.load(test1_data_x_path)\n",
    "test1_data_y = np.load(test1_data_y_path)\n",
    "test2_data_x = np.load(test2_data_x_path)\n",
    "test2_data_y = np.load(test2_data_y_path)\n",
    "test3_data_x = np.load(test3_data_x_path)\n",
    "test3_data_y = np.load(test3_data_y_path)\n",
    "\n",
    "x_train, x_test, y_train, y_test = train_test_split(data_x, data_y, random_state=0, shuffle=True, train_size=0.8)\n",
    "test1_x_train, test1_x_test, test1_y_train, test1_y_test = train_test_split(test1_data_x, test1_data_y, random_state=0, shuffle=True, train_size=0.8)\n",
    "test2_x_train, test2_x_test, test2_y_train, test2_y_test = train_test_split(test2_data_x, test2_data_y, random_state=0, shuffle=True, train_size=0.8)\n",
    "test3_x_train, test3_x_test, test3_y_train, test3_y_test = train_test_split(test3_data_x, test3_data_y, random_state=0, shuffle=True, train_size=0.8)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "c0e3eASOeD2F"
   },
   "outputs": [],
   "source": [
    "def draw_confusion_matrix(y_test, preds, classifier_name=''):\n",
    "  score = accuracy_score(y_test, preds)\n",
    "  cm = metrics.confusion_matrix(y_test, preds)\n",
    "\n",
    "  plt.figure(figsize=(9,9))\n",
    "  sns.heatmap(cm, annot=True, fmt=\".0f\", linewidths=.5, square = True, cmap = 'OrRd', xticklabels=['Original', 'Adversial'], yticklabels=['Original', 'Adversial'])\n",
    "  plt.ylabel('Actual label')\n",
    "  plt.xlabel('Predicted label')\n",
    "  all_sample_title = '{0}\\n Accuracy Score: {1}'.format(classifier_name, score)\n",
    "  plt.title(all_sample_title, size = 15)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "G9q0R5VReRJV"
   },
   "source": [
    "# Random Forest Classifier"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "pHv2_36iaR6F",
    "outputId": "2dda8c0d-0363-4e86-86a2-2133c6537013"
   },
   "outputs": [],
   "source": [
    "from sklearn.ensemble import RandomForestClassifier\n",
    "randomF = RandomForestClassifier(random_state=42)\n",
    "randomF.fit(x_train,y_train)\n",
    "\n",
    "preds = randomF.predict(test1_x_test)\n",
    "draw_confusion_matrix(test1_y_test, preds, 'Random Forest Classifier Testset IMDB')\n",
    "print(classification_report(test1_y_test, preds))\n",
    "\n",
    "preds = randomF.predict(test2_x_test)\n",
    "draw_confusion_matrix(test2_y_test, preds, 'Random Forest Classifier Testset Yelp_Polarity')\n",
    "print(classification_report(test2_y_test, preds))\n",
    "\n",
    "preds = randomF.predict(test3_x_test)\n",
    "draw_confusion_matrix(test3_y_test, preds, 'Random Forest Classifier Testset SST-2')\n",
    "print(classification_report(test3_y_test, preds))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "QBC5hVZleWAW"
   },
   "source": [
    "# Multilayer Neural Network"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "qxpZBrgcaR6R",
    "outputId": "05647662-05a0-4810-8e5b-75878ff12c80"
   },
   "outputs": [],
   "source": [
    "# Try the same in Keras\n",
    "import tensorflow as tf\n",
    "from tensorflow.keras.initializers import glorot_uniform\n",
    "from tensorflow.keras.regularizers import l1\n",
    "\n",
    "\n",
    "input_shape = 200\n",
    "\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(400, input_shape=(input_shape,), activation='relu', kernel_regularizer=l1(0.00001), kernel_initializer=glorot_uniform(seed=42)),\n",
    "    tf.keras.layers.Dropout(0.5, seed=42),\n",
    "    tf.keras.layers.Dense(400, activation='relu', kernel_regularizer=l1(0.00001), kernel_initializer=glorot_uniform(seed=42)),\n",
    "    tf.keras.layers.Dense(1, activation='sigmoid', kernel_initializer=glorot_uniform(seed=seed))\n",
    "])\n",
    "\n",
    "model.compile(optimizer='adam',\n",
    "              loss='binary_crossentropy',\n",
    "              metrics=['accuracy'])\n",
    "\n",
    "model.fit(x_train, y_train, epochs=10, validation_split=0.1)\n",
    "model.evaluate(x_test, y_test)\n",
    "\n",
    "preds = model.predict(test1_x_test)\n",
    "preds = preds.flatten()\n",
    "preds[preds < 0.5] = 0\n",
    "preds[preds >= 0.5] = 1\n",
    "draw_confusion_matrix(test1_y_test, preds, 'Multilayer Neural Network Testset IMDB')\n",
    "print(classification_report(test1_y_test, preds))\n",
    "\n",
    "preds = model.predict(test2_x_test)\n",
    "preds = preds.flatten()\n",
    "preds[preds < 0.5] = 0\n",
    "preds[preds >= 0.5] = 1\n",
    "draw_confusion_matrix(test2_y_test, preds, 'Multilayer Neural Network Testset Yelp_Polarity')\n",
    "print(classification_report(test2_y_test, preds))\n",
    "\n",
    "preds = model.predict(test3_x_test)\n",
    "preds = preds.flatten()\n",
    "preds[preds < 0.5] = 0\n",
    "preds[preds >= 0.5] = 1\n",
    "draw_confusion_matrix(test3_y_test, preds, 'Multilayer Neural Network Testset SST2')\n",
    "print(classification_report(test3_y_test, preds))\n"
   ]
  }
 ],
 "metadata": {
  "accelerator": "GPU",
  "colab": {
   "collapsed_sections": [
    "uRUMgisCbgs8",
    "A3iyqbuNb9kl",
    "qOO4KyxCcOID",
    "T8llR4x3cbPD",
    "9arIRas1clxg",
    "qUIf1br_dI0d",
    "a1h6k423dQ7n",
    "I31EqMytdsGm",
    "n53jvb8Kn3ea"
   ],
   "name": "Transferability_SHAP_Detector(1).ipynb",
   "provenance": [],
   "toc_visible": true
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
