{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 77786,
     "status": "ok",
     "timestamp": 1652363005478,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "8hceYqOsrvR9",
    "outputId": "8f8cab7b-be1a-489f-d6bd-5b486c5bc4f0"
   },
   "outputs": [],
   "source": [
    "import os\n",
    "import sys\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 11767,
     "status": "ok",
     "timestamp": 1652363017240,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "fy_wPf0hr3cK"
   },
   "outputs": [],
   "source": [
    "import deel.lip as lip\n",
    "from deel.lip.layers import *\n",
    "from deel.lip.losses import *\n",
    "from deel.lip.utils import *\n",
    "\n",
    "import dlt\n",
    "import dlt.data.loader as loader\n",
    "import dlt.data.pipeline as pipeline\n",
    "import dlt.data.augmentation as aug\n",
    "import dlt.infrastructure.distributed_training as distributed\n",
    "from dlt.extras.layers import skip_connections as skips\n",
    "from dlt.model_factory import *\n",
    "\n",
    "import tensorflow as tf\n",
    "import numpy as np\n",
    "\n",
    "from xplique.attributions import *\n",
    "from xplique.metrics import *\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "from scipy.stats import spearmanr\n",
    "from scipy.ndimage import gaussian_filter\n",
    "\n",
    "import tensorflow.keras.optimizers as optimizers\n",
    "from tensorflow.keras.models import Sequential, Model\n",
    "from tensorflow.keras.layers import Dense, Activation\n",
    "import tensorflow_datasets as tfds\n",
    "\n",
    "\n",
    "plt.style.use('seaborn')\n",
    "%config InlineBackend.figure_format = 'retina'\n",
    "def set_size(w,h):\n",
    "  \"\"\"Set matplot figure size\"\"\"\n",
    "  plt.rcParams[\"figure.figsize\"] = [w,h]\n",
    "\n",
    "def show(img, p=False, smooth=False, **kwargs):\n",
    "  \"\"\"handle imshow of images and cmaps\"\"\"\n",
    "  img = np.array(img, dtype=np.float32)\n",
    "\n",
    "  # check if channel first\n",
    "  if img.shape[0] == 1:\n",
    "    img = img[0]\n",
    "  elif img.shape[0] == 3:\n",
    "    img = np.moveaxis(img, 0, 2)\n",
    "  # check if cmap\n",
    "  if img.shape[-1] == 1:\n",
    "    img = img[:,:,0]\n",
    "  # normalize\n",
    "  if img.max() > 1 or img.min() < 0:\n",
    "    img -= img.min(); img/=img.max()\n",
    "  # check if clip percentile\n",
    "  if p is not False:\n",
    "    img = np.clip(img, np.percentile(img, p), np.percentile(img, 100-p))\n",
    "  \n",
    "  if smooth and len(img.shape) == 2:\n",
    "    img = gaussian_filter(img, smooth)\n",
    "\n",
    "  plt.imshow(img, **kwargs)\n",
    "  plt.axis('off')\n",
    "  plt.grid(None)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 6,
     "status": "ok",
     "timestamp": 1652363017520,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "JORuiURyvCTh"
   },
   "outputs": [],
   "source": [
    "from tensorflow.keras.models import (\n",
    "    load_model as keras_load_model,\n",
    "    model_from_json as keras_model_from_json,\n",
    "    model_from_yaml as keras_model_from_yaml,\n",
    ")\n",
    "\n",
    "model_path = \"/content/drive/MyDrive/HKR XAI/CelebA\"\n",
    "\n",
    "batch_size = 512\n",
    "norm_factor = 255.0\n",
    "alphaHKR = 20.0\n",
    "min_margin = 0.2\n",
    "learning_rate = 1e-2\n",
    "selected_classes = np.array([2, 4, 7, 8, 9, 10, 11, 15, 17, 18, 20, 21, 22, 28, 29, 30, 31, 34, 35, 36, 38, 39])\n",
    "\n",
    "def load_network(net_path,net_name, use_json=False):\n",
    "    modelPath2 = os.path.join(net_path,net_name)\n",
    "    if use_json:\n",
    "        json_file = open(modelPath2+'.json', 'r')\n",
    "        loaded_model_json = json_file.read()\n",
    "        json_file.close()\n",
    "        loaded_model = keras_model_from_json(loaded_model_json)\n",
    "        # load weights into new model\n",
    "        loaded_model.load_weights(modelPath2+'.h5')\n",
    "    else:\n",
    "        loaded_model = keras_load_model(modelPath2+'.h5',compile=False)\n",
    "    #loaded_model.summary()\n",
    "    print(\"Loaded model from disk\")\n",
    "    return loaded_model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2496,
     "status": "ok",
     "timestamp": 1652363020011,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "zio5jeHD6onY",
    "outputId": "a9353333-66dd-4aea-b7be-616b85a9e1a9"
   },
   "outputs": [],
   "source": [
    "model_name = \"model_22labels_unconstrained_epoch100_fullmodel\"\n",
    "chosen_label_name = 'Mustache' #'Wearing_Hat' # 'Gray_Hair'  #'Bald' #'Heavy_Makeup' #'Wearing_Lipstick' #'Mustache'\n",
    "\n",
    "model = load_network(model_path,model_name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 944,
     "status": "ok",
     "timestamp": 1652363020952,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "GnQ6riROu2-L",
    "outputId": "e3341f32-9920-4ba1-ae98-2e6f3f9a2de3"
   },
   "outputs": [],
   "source": [
    "AUTO = tf.data.AUTOTUNE\n",
    "\n",
    "gcs_base_dir = \"gs://celeb_a_dataset/\"\n",
    "celeb_a_builder = tfds.builder(\"celeb_a\", data_dir=gcs_base_dir, version='2.0.0')\n",
    "celeb_a_builder.download_and_prepare()\n",
    "\n",
    "num_test_shards_dict = {'0.3.0': 4, '2.0.0': 2} # Used because we download the test dataset separately\n",
    "version = str(celeb_a_builder.info.version)\n",
    "print('Celeb_A dataset version: %s' % version)\n",
    "\n",
    "def make_ds():\n",
    "  ds = celeb_a_builder.as_dataset(split='test')\n",
    "  return ds\n",
    "\n",
    "def make_binary_dataset(ds, label_name):\n",
    "  ds = ds.map(lambda data: (tf.cast(data['image'], tf.float32) / norm_factor, data['attributes'][label_name]), num_parallel_calls=AUTO)\n",
    "  ds = ds.map(lambda x,y: (x, tf.one_hot(tf.cast(y, tf.uint8), 2)), num_parallel_calls=AUTO)\n",
    "  return ds"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000,
     "output_embedded_package_id": "1PbwnAPN-XqiO7CVq1GyrKa1k-1BeRkcC"
    },
    "executionInfo": {
     "elapsed": 34608,
     "status": "ok",
     "timestamp": 1652349133180,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "PU4lulnx30Ss",
    "outputId": "a40147bb-4c9d-4272-e662-e35cf25f32c5"
   },
   "outputs": [],
   "source": [
    "ds_binary = make_binary_dataset(make_ds(), chosen_label_name)\n",
    "\n",
    "i = 1\n",
    "set_size(15, 15)\n",
    "for x,y in ds_binary.take(99):\n",
    "  plt.subplot(10, 10, i+1)\n",
    "  show(x)\n",
    "  plt.title(np.argmax(y))\n",
    "  i+=1\n",
    "plt.tight_layout()\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1836,
     "status": "ok",
     "timestamp": 1652363022785,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "UlMP7NPS8G4D",
    "outputId": "29efdc66-c6e0-4c6d-ffbd-6a51719eb64b"
   },
   "outputs": [],
   "source": [
    "ds = make_ds()\n",
    "data = [d for d in ds.take(1)][0]\n",
    "\n",
    "class_names = np.array([k for k in data['attributes'].keys()])\n",
    "assert class_names[0] == '5_o_Clock_Shadow'\n",
    "assert class_names[-1] == 'Young'\n",
    "\n",
    "print('x:', data['image'].shape, ' attributes:', class_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 7,
     "status": "ok",
     "timestamp": 1652363022785,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "khgc9Zu_uDDM",
    "outputId": "6d87a6cd-0d75-4c2c-a5bb-9244bf896830"
   },
   "outputs": [],
   "source": [
    "if selected_classes is None:\n",
    "    nb_classes = len(class_names)\n",
    "    all_selected_classes = np.ones((nb_classes,)).astype(np.bool)\n",
    "else:\n",
    "    print(list(selected_classes))\n",
    "    nb_classes = len(set(selected_classes))\n",
    "    one_hot = np.eye(len(class_names))[selected_classes]\n",
    "    all_selected_classes = np.sum(one_hot,axis=0).astype(np.bool)\n",
    "print(all_selected_classes)\n",
    "print(\"nb_classes \", nb_classes)\n",
    "print(\"Selected classes :\", np.asarray(class_names)[all_selected_classes])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 4,
     "status": "ok",
     "timestamp": 1652363022786,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "TzIJ_zt1-fE7"
   },
   "outputs": [],
   "source": [
    "def make_binary_classif_model(loaded_model, last_layer, label, reverse=1.0, biais=0.0):\n",
    "\n",
    "    output_logits = loaded_model.layers[last_layer].output.shape[-1]\n",
    "    assert label<output_logits\n",
    "\n",
    "    logits_layer = loaded_model.layers[last_layer]\n",
    "    out = Dense(2, activation=None, name='classif')(loaded_model.layers[last_layer].output)\n",
    "\n",
    "    last_weights  = np.zeros((output_logits,2))\n",
    "    last_weights[label,:] = reverse * np.asarray([[-1, 1]])\n",
    "\n",
    "    model = tf.keras.Model(loaded_model.inputs, out)\n",
    "    \n",
    "    model.layers[-1].set_weights([last_weights, np.asarray([reverse * biais, -reverse * biais])])\n",
    "    model.built = True\n",
    "    return model"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "MpJoZtbS7LUI"
   },
   "source": [
    "# Loading Model and preparing dataset"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 29316,
     "status": "ok",
     "timestamp": 1652363052099,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "LNzbg_AxA_T-",
    "outputId": "db10e256-084c-426c-c3a9-49e9b95347d3"
   },
   "outputs": [],
   "source": [
    "model_name = \"model_22labels_unconstrained_epoch100_fullmodel\"\n",
    "chosen_label_name = 'Mustache' #'Wearing_Hat' # 'Gray_Hair'  #'Bald' #'Heavy_Makeup' #'Wearing_Lipstick' #'Mustache'\n",
    "chosen_label = np.argmax(np.asarray(class_names)[all_selected_classes]==chosen_label_name)\n",
    "\n",
    "model = load_network(model_path,model_name)\n",
    "binary_model = make_binary_classif_model(model, last_layer=-1, label=chosen_label)   \n",
    "\n",
    "loss = tf.keras.losses.BinaryCrossentropy(from_logits=True)\n",
    "#HKR_multilabel(alpha = alphaHKR,  min_margin=min_margin)\n",
    "\n",
    "binary_model.compile(loss=loss, metrics=[\"accuracy\"], optimizer=optimizers.Adam(learning_rate=learning_rate))\n",
    "\n",
    "ds_binary = make_binary_dataset(make_ds(), chosen_label_name)\n",
    "binary_model.evaluate(ds_binary.batch(256))"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "0a-8rud_-DYu"
   },
   "source": [
    "# Test gradient explanations"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000,
     "output_embedded_package_id": "1oAm7LesKydOcF7Lr0vF7kOLsOORB1Luc"
    },
    "executionInfo": {
     "elapsed": 42165,
     "status": "ok",
     "timestamp": 1652349370251,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "GgadbIoP7J4N",
    "outputId": "9c345121-4775-4b2a-82cd-53c216c8989c"
   },
   "outputs": [],
   "source": [
    "explainer = Saliency(binary_model, batch_size=128)\n",
    "set_size(20, 20)\n",
    "\n",
    "phis = None\n",
    "for bx, by in ds_binary.batch(25).take(1):\n",
    "  phis = explainer(bx, by)\n",
    "  \n",
    "  i = 0\n",
    "  for x,y,h in zip(bx, by, phis):\n",
    "    plt.subplot(5, 5, i+1)\n",
    "    show(x)\n",
    "    show(h, cmap='jet', alpha=0.4, p=0.5, smooth=False)\n",
    "    i+=1\n",
    "  plt.savefig('non_robust_grad.png', dpi=300)\n",
    "  plt.show()\n"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "scJyLDqw-F6L"
   },
   "source": [
    "# (1) Computing Explanations Metrics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "EDuujeAe-FYi"
   },
   "outputs": [],
   "source": [
    "from xplique.attributions import (Saliency, GradientInput, GradCAM, IntegratedGradients, \n",
    "                                  SmoothGrad, VarGrad, SquareGrad, Occlusion, Rise, \n",
    "                                  GuidedBackprop, GradCAMPP, Lime, KernelShap, SobolAttributionMethod)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 11055195,
     "status": "ok",
     "timestamp": 1651963915583,
     "user": {
      "displayName": "River Dread",
      "userId": "09094954806195578933"
     },
     "user_tz": -120
    },
    "id": "NjggdtAN7Zve",
    "outputId": "12689372-883a-4a28-b85a-00e95d1f4b68"
   },
   "outputs": [],
   "source": [
    "nb_elements = 1000\n",
    "batch_size  = 256\n",
    "\n",
    "X_test = []\n",
    "Y_test = []\n",
    "\n",
    "for x,y in ds_binary.take(nb_elements):\n",
    "  X_test.append(x)\n",
    "  Y_test.append(y)\n",
    "\n",
    "X_test = np.array(X_test, np.float32)\n",
    "Y_test = np.array(Y_test, np.float32)\n",
    "\n",
    "np.save('X_test.npy', X_test)\n",
    "np.save('Y_test.npy', Y_test)\n",
    "\n",
    "explainers = [\n",
    "              Saliency(binary_model, -1, batch_size = batch_size),\n",
    "              GradientInput(binary_model, -1, batch_size = batch_size),\n",
    "              GradCAM(binary_model, -1, batch_size = batch_size),\n",
    "              GradCAMPP(binary_model, -1, batch_size = batch_size),\n",
    "              IntegratedGradients(binary_model, -1, steps = 20, batch_size = batch_size),\n",
    "              SmoothGrad(binary_model, -1, nb_samples = 20, batch_size = batch_size),\n",
    "              VarGrad(binary_model, -1, nb_samples = 20, batch_size = batch_size),\n",
    "              SquareGrad(binary_model, -1, nb_samples = 20, batch_size = batch_size),\n",
    "              Occlusion(binary_model, batch_size = batch_size, patch_size=10, patch_stride=10),\n",
    "              Rise(binary_model, batch_size = batch_size, nb_samples = 3000),\n",
    "              SobolAttributionMethod(binary_model, nb_design = 32, batch_size = batch_size, grid_size = 7),\n",
    "]\n",
    "\n",
    "for explainer in explainers:\n",
    "  explainer_name = explainer.__class__.__name__\n",
    "  phis = explainer(X_test, Y_test)\n",
    "\n",
    "  phis = np.abs(phis)\n",
    "  if len(phis.shape) == 4:\n",
    "    phis = np.max(phis, -1)\n",
    "  \n",
    "  if phis.shape[1] != X_test.shape[1]:\n",
    "    phis = np.moveaxis(phis, 1, 2)\n",
    "  \n",
    "  phis = np.array(phis, np.float16)\n",
    "\n",
    "  np.save(f'{model_name}_{explainer_name}.npy', phis) \n",
    "  print('done for ', explainer_name, phis.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 892,
     "status": "ok",
     "timestamp": 1652363052987,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "p65nzdy2YCZr",
    "outputId": "1b203e9a-6c65-42b7-cf38-8098ff5808fb"
   },
   "outputs": [],
   "source": [
    "metric_model = load_network(model_path,model_name)\n",
    "metric_model = make_binary_classif_model(metric_model, last_layer=-1, label=chosen_label)   \n",
    "metric_model.layers[-1].activation = tf.keras.activations.softmax"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5,
     "status": "ok",
     "timestamp": 1652349663774,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "f9ROcDVouSr3",
    "outputId": "a15a7578-5f03-4e98-c011-3399b5e500b4"
   },
   "outputs": [],
   "source": [
    "!cp *.npy \"/content/drive/MyDrive/HKR XAI/data\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1120354,
     "status": "ok",
     "timestamp": 1651965101295,
     "user": {
      "displayName": "River Dread",
      "userId": "09094954806195578933"
     },
     "user_tz": -120
    },
    "id": "XJicd5ls_j-9",
    "outputId": "acd3366e-47bf-4858-afa2-70a6e74a7104"
   },
   "outputs": [],
   "source": [
    "from xplique.metrics import MuFidelity, Deletion, Insertion\n",
    "\n",
    "x_max, x_min = X_test.max(), X_test.min()\n",
    "baseline_zero    = 0.0\n",
    "baseline_uniform = lambda x: np.random.uniform(size=x.shape) * (x_max-x_min) - x_min \n",
    "\n",
    "metrics = [\n",
    "           MuFidelity(binary_model, X_test, Y_test, batch_size = batch_size, grid_size = 8, nb_samples = 50, baseline_mode = baseline_uniform),\n",
    "           Deletion(binary_model, X_test, Y_test, steps = 6, baseline_mode = baseline_uniform),\n",
    "           Insertion(binary_model, X_test, Y_test, steps = 6, baseline_mode = baseline_uniform),\n",
    "]\n",
    "\n",
    "for metric in metrics:\n",
    "  metric_name = metric.__class__.__name__\n",
    "  table = []\n",
    "  \n",
    "  for explainer in explainers:\n",
    "    explainer_name = explainer.__class__.__name__ \n",
    "    phis = np.load(f'{model_name}_{explainer_name}.npy')\n",
    "    phis = tf.cast(phis, tf.float32)[:,:,:,None]\n",
    "\n",
    "    score = metric(phis)\n",
    "    table.append((metric_name, model_name, explainer_name, score))\n",
    "    print(metric_name, explainer_name, score)\n",
    "  \n",
    "  np.save(f'results_{model_name}_{metric_name}_uniform', table)\n",
    "  print('\\n\\n')\n",
    "    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1041419,
     "status": "ok",
     "timestamp": 1651966142692,
     "user": {
      "displayName": "River Dread",
      "userId": "09094954806195578933"
     },
     "user_tz": -120
    },
    "id": "Vp-Y1V4zSf0Z",
    "outputId": "e51b5279-a699-490c-9a12-ce65383daff1"
   },
   "outputs": [],
   "source": [
    "from xplique.metrics import MuFidelity, Deletion, Insertion\n",
    "\n",
    "x_max, x_min = X_test.max(), X_test.min()\n",
    "baseline_zero    = 0.0\n",
    "baseline_uniform = lambda x: np.random.uniform(size=x.shape) * (x_max-x_min) - x_min \n",
    "\n",
    "metrics = [\n",
    "           MuFidelity(binary_model, X_test, Y_test, batch_size = batch_size, grid_size = 8, nb_samples = 50, baseline_mode = baseline_zero),\n",
    "           Deletion(binary_model, X_test, Y_test, steps = 6, baseline_mode = baseline_zero),\n",
    "           Insertion(binary_model, X_test, Y_test, steps = 6, baseline_mode = baseline_zero),\n",
    "]\n",
    "\n",
    "for metric in metrics:\n",
    "  metric_name = metric.__class__.__name__\n",
    "  table = []\n",
    "  \n",
    "  for explainer in explainers:\n",
    "    explainer_name = explainer.__class__.__name__ \n",
    "    phis = np.load(f'{model_name}_{explainer_name}.npy')\n",
    "    phis = tf.cast(phis, tf.float32)[:,:,:,None]\n",
    "\n",
    "    score = metric(phis)\n",
    "    table.append((metric_name, model_name, explainer_name, score))\n",
    "    print(metric_name, explainer_name, score)\n",
    "  \n",
    "  np.save(f'results_{model_name}_{metric_name}_zero', table)\n",
    "  print('\\n\\n')\n",
    "    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "Ayh5DuKi5RXW"
   },
   "outputs": [],
   "source": [
    "!cp results_* \"/content/drive/MyDrive/HKR XAI/results\""
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "lO9yVJJ2U0gq"
   },
   "source": [
    "# (2)Robustness-sr"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "Pwhyk6U8kHKx"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 357,
     "status": "ok",
     "timestamp": 1652367417160,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "2U5orZWBVjeB"
   },
   "outputs": [],
   "source": [
    "\n",
    "def epsilons_l2(dimensions, epsilon, nb_samples, masks):\n",
    "  normal_deviations = np.random.normal(size=(nb_samples, dimensions))\n",
    "  radius = np.linalg.norm(normal_deviations, axis=1, keepdims=True)\n",
    "  normal_deviations = normal_deviations * (np.random.rand(nb_samples, dimensions) ** (1.0 / dimensions))\n",
    "\n",
    "  points = normal_deviations * epsilon / radius\n",
    "  samples = tf.cast(points * masks, tf.float32)\n",
    "\n",
    "  return samples\n",
    "\n",
    "@tf.function\n",
    "def _pgd_step(model, inputs, labels):\n",
    "  with tf.GradientTape() as tape:\n",
    "    tape.watch(inputs)\n",
    "    outputs = model(inputs) \n",
    "    loss = tf.keras.losses.binary_crossentropy(labels, outputs, from_logits=False)\n",
    "\n",
    "  grads = tape.gradient(loss, inputs)\n",
    "  return grads, loss\n",
    "\n",
    "\n",
    "def _pgd_projection(grads, step_size, adversarials, inputs, epsilons):\n",
    "    grad_l2_norm = tf.linalg.norm(tf.reshape(grads, (len(grads), -1)), axis=-1)\n",
    "    grad_l2_norm = grad_l2_norm[:, tf.newaxis, tf.newaxis, tf.newaxis]\n",
    "    grads = grads * step_size / grad_l2_norm\n",
    "\n",
    "    adversarials += grads\n",
    "    delta = adversarials - inputs\n",
    "\n",
    "    # project the element to the closest point of the l2 ball if necessary\n",
    "    delta_norm = tf.linalg.norm(tf.reshape(delta, (len(delta), -1)), axis=-1)\n",
    "    need_projection = tf.cast(delta_norm <= epsilons, tf.float32)\n",
    "    \n",
    "    scaling_factor = delta_norm * (1.0 - need_projection) + epsilons * need_projection\n",
    "\n",
    "    delta *= tf.reshape(epsilons / scaling_factor, (len(epsilons), 1, 1, 1))\n",
    "\n",
    "    return delta\n",
    "\n",
    "@tf.function\n",
    "def _iter_delta(model, adversarials, labels, masks, step_size, inputs, epsilons):\n",
    "  grads, loss = _pgd_step(model, adversarials, labels)\n",
    "  grads *= masks\n",
    "\n",
    "  delta = _pgd_projection(grads, step_size, adversarials, inputs, epsilons)\n",
    "  return delta\n",
    "\n",
    "#@tf.function\n",
    "def projected_gradient_descent(model, inputs, labels, epsilons, masks, \n",
    "                               iterations=100, step_size=1e-2):\n",
    "  \n",
    "  adversarials = tf.cast(inputs, tf.float32)\n",
    "  inputs = tf.cast(inputs, tf.float32)\n",
    "  masks = tf.cast(masks, tf.float32)\n",
    "\n",
    "  epsilons_step = epsilons / iterations\n",
    "  #print('epsilons_step', epsilons_step)\n",
    "\n",
    "  #print('masks ? ', masks.shape)\n",
    "  \"\"\"\n",
    "  for iteration_i in tf.range(iterations):\n",
    "    grads, _ = _pgd_step(model, adversarials, labels)\n",
    "    grads = grads * masks\n",
    "    \n",
    "    scaler = tf.reduce_sum(tf.abs(grads), (1, 2, 3))\n",
    "    scaler = scaler\n",
    "    scaler = scaler[:, None, None, None]\n",
    "\n",
    "    grads = grads / scaler * epsilons_step[:, None, None, None]\n",
    "    #grads = grads\n",
    "    #print('applying grad of norm', tf.reduce_sum(tf.abs(grads), (1,2,3)), \"epsilons:\", epsilons)\n",
    "    adversarials = adversarials + grads \n",
    "\n",
    "  print('adversarial / inputs differences', tf.reduce_sum(tf.abs(adversarials - inputs), (1,2,3)) ) \n",
    "  \"\"\"\n",
    "  \n",
    "  for iteration_i in tf.range(iterations):\n",
    "    delta = _iter_delta(model, adversarials, labels, masks, step_size, inputs, epsilons)\n",
    "    adversarials += delta\n",
    "  \n",
    "  #adversarials = tf.clip_by_value(adversarials, -1.0, 1.0)\n",
    "  success = tf.argmax(model(inputs), -1) != tf.argmax(model(adversarials), -1)\n",
    "\n",
    "  return success, adversarials"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 2,
     "status": "ok",
     "timestamp": 1652367417920,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "IzyNPRuC0xAj"
   },
   "outputs": [],
   "source": [
    "def pgd_bisection(model, inputs, masks, labels,\n",
    "                  start_epsilon=1e-3,\n",
    "                  tolerance=1e-5, max_steps=100, \n",
    "                  upscale_rate=10.0, downscale_rate=10.0,\n",
    "                  iterations=10):\n",
    "  \"\"\"\n",
    "  Bisection algorithm to find the min epsilon\n",
    "  \"\"\"\n",
    "  nb_elements = len(inputs)\n",
    "\n",
    "  upper_not_found = np.ones(nb_elements)\n",
    "  upper_epsilons = np.full(nb_elements, np.inf)\n",
    "  lower_not_found = np.ones(nb_elements)\n",
    "  lower_epsilons = np.full(nb_elements, -np.inf)\n",
    "\n",
    "  epsilons = np.ones(nb_elements, dtype=np.float32) * start_epsilon\n",
    "\n",
    "  optimal_adversarials = np.zeros(inputs.shape)\n",
    "\n",
    "  step = 0\n",
    "  # we start with all element\n",
    "  ids_to_finds = np.arange(nb_elements)\n",
    "\n",
    "  while len(ids_to_finds):\n",
    "    successes, adversarials = projected_gradient_descent(model, inputs[ids_to_finds], labels[ids_to_finds], \n",
    "                                                         epsilons=epsilons[ids_to_finds], masks=masks[ids_to_finds],\n",
    "                                                         iterations=iterations)\n",
    "    \n",
    "    #print('one pgd done', len(ids_to_finds), epsilons)\n",
    "\n",
    "    for i, input_id in enumerate(ids_to_finds):\n",
    "      eps = epsilons[input_id]\n",
    "\n",
    "      if successes[i]:\n",
    "        # update the current adversarial\n",
    "        optimal_adversarials[input_id] = adversarials[i]\n",
    "        # we have an adv, so it's an epsilon upper-bound\n",
    "        upper_epsilons[input_id] = epsilons[input_id]\n",
    "\n",
    "        if lower_not_found[input_id]:\n",
    "          # if we have not found a lower bound, we keep decreasing\n",
    "          epsilons[input_id] /= downscale_rate \n",
    "        else:\n",
    "          # we already reach a lower bound, so we shouldn't divide by downscale\n",
    "          epsilons[input_id] =  0.5 * (lower_epsilons[input_id] + upper_epsilons[input_id])\n",
    "\n",
    "        upper_not_found[input_id] = False\n",
    "      \n",
    "      else:\n",
    "        # we have not found an adv, so it's an epsilon lower-bound\n",
    "        lower_epsilons[input_id] = epsilons[input_id]\n",
    "\n",
    "        if upper_not_found[input_id]:\n",
    "          # if we have not found an adv yet, we keep increasing\n",
    "          epsilons[input_id] *= upscale_rate \n",
    "        else:\n",
    "          # we already have and adv, we should go slower\n",
    "          epsilons[input_id] =  0.5 * (lower_epsilons[input_id] + upper_epsilons[input_id])\n",
    "\n",
    "        lower_not_found[input_id] = False\n",
    "    \n",
    "    step += 1\n",
    "    ids_not_found = (upper_epsilons - lower_epsilons) > tolerance\n",
    "    ids_to_finds = np.arange(nb_elements)[ids_not_found]\n",
    "    \n",
    "    if step >= max_steps:\n",
    "        break\n",
    "\n",
    "  return upper_epsilons, optimal_adversarials\n",
    "\n",
    "def robustness_sr(model, inputs, phis, labels, start_epsilon=5e-3,\n",
    "                  tolerance=5e-5, max_steps=25, \n",
    "                  upscale_rate=10.0, downscale_rate=10.0,\n",
    "                  iterations=100,\n",
    "                  verbose=False):\n",
    "    inputs = np.array(inputs)\n",
    "    labels = np.array(labels)\n",
    "    phis = np.array(phis)\n",
    "    percents = [0.05 * i for i in range(1, 5)]\n",
    "    \n",
    "    # flatten phis to select the best K-ids\n",
    "    original_shape = phis.shape\n",
    "    phis = np.array(phis).reshape((len(phis), -1))\n",
    "    \n",
    "    epsilons = []\n",
    "\n",
    "    for percent in percents:\n",
    "      masks = np.zeros_like(phis, dtype=np.float32)\n",
    "      for phi_id, phi in enumerate(phis):\n",
    "        to_select = np.argsort(phi)[::-1][:int(len(phi) * percent)]\n",
    "        masks[phi_id, to_select] = 1.0\n",
    "\n",
    "      masks = masks.reshape(original_shape)\n",
    "      #print(\"masks ?\", masks.shape)\n",
    "      eps, _ = pgd_bisection(model, inputs, masks, labels,\n",
    "                             start_epsilon=start_epsilon,\n",
    "                             tolerance=tolerance, max_steps=max_steps, \n",
    "                             upscale_rate=upscale_rate, downscale_rate=downscale_rate,\n",
    "                             iterations=iterations)\n",
    "      \n",
    "      # remove adversarial that has not been found\n",
    "      # avoid inf. value by using a ceil number, could be improved\n",
    "      eps = np.clip(eps, 0, 100.0)\n",
    "      epsilons.append(eps)\n",
    "    if verbose:\n",
    "      print('epsilons:', epsilons)\n",
    "      plt.hist(epsilons, bins=len(epsilons))\n",
    "      plt.xscale('log')\n",
    "      plt.show()\n",
    "    \n",
    "    avg_epsilon = np.mean(epsilons, -1)\n",
    "    auc = np.mean(avg_epsilon[:-1] + avg_epsilon[1:]) * 0.5 # trapezoidal rule\n",
    "\n",
    "    return auc"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 1153,
     "status": "ok",
     "timestamp": 1652367420234,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "i2OHYGNqYCQm"
   },
   "outputs": [],
   "source": [
    "X_test, Y_test = np.load('data/X_test.npy'), np.load('data/Y_test.npy')\n",
    "Y_test = tf.one_hot(np.argmax(metric_model.predict(X_test, batch_size = 256), -1), 2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 485
    },
    "executionInfo": {
     "elapsed": 559800,
     "status": "error",
     "timestamp": 1652367985650,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "EQUANJmdwJ5z",
    "outputId": "f99fd648-bc33-4090-c7eb-41923943e829"
   },
   "outputs": [],
   "source": [
    "from xplique.metrics import MuFidelity, Deletion, Insertion\n",
    "\n",
    "metric_name = 'robustness_sr'\n",
    "table = []\n",
    "\n",
    "l = 32\n",
    "\n",
    "for explainer_name in explainers_names:\n",
    "  #explainer_name = explainer.__class__.__name__ \n",
    "  phis = np.load(f'data/{model_name}_{explainer_name}.npy')\n",
    "  phis = tf.cast(phis, tf.float32)[:,:,:,None]\n",
    "\n",
    "  score = robustness_sr(metric_model, X_test[:l], phis[:l], Y_test[:l], \n",
    "                        start_epsilon = 0.1, tolerance = 1e-2, max_steps = 5,\n",
    "                        iterations = 100)\n",
    "\n",
    "  #score = metric(phis)\n",
    "  table.append((metric_name, model_name, explainer_name, score))\n",
    "  print(metric_name, explainer_name, score)\n",
    "\n",
    "np.save(f'results_{model_name}_{metric_name}', table)\n",
    "print('\\n\\n')\n",
    "    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "6_N214FOg9zf"
   },
   "outputs": [],
   "source": [
    "!cp -r \"/content/drive/MyDrive/HKR XAI/data\" ./"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 1326,
     "status": "ok",
     "timestamp": 1652363934586,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "w0ewoU58gqpy"
   },
   "outputs": [],
   "source": [
    "explainers_names = [p for p in os.listdir('data') if 'results' not in p and 'model' in p]\n",
    "explainers_names = [p for p in explainers_names if model_name in p]\n",
    "explainers_names = [p.split('_')[-1].split('.npy')[0] for p in explainers_names]\n",
    "explainers_names\n",
    "\n",
    "X_test, Y_test = np.load('data/X_test.npy'), np.load('data/Y_test.npy')\n",
    "Y_test = tf.one_hot(np.argmax(metric_model.predict(X_test, batch_size = 256), -1), 2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 627
    },
    "executionInfo": {
     "elapsed": 663879,
     "status": "error",
     "timestamp": 1651999531535,
     "user": {
      "displayName": "River Dread",
      "userId": "09094954806195578933"
     },
     "user_tz": -120
    },
    "id": "-ZeuPxVFU3X4",
    "outputId": "c44e21bd-f96c-47a2-ae84-ddeaf7742964"
   },
   "outputs": [],
   "source": [
    "from xplique.metrics import MuFidelity, Deletion, Insertion\n",
    "\n",
    "metric_name = 'robustness_sr'\n",
    "table = []\n",
    "\n",
    "l = 1000\n",
    "\n",
    "for explainer in explainers:\n",
    "  explainer_name = explainer.__class__.__name__ \n",
    "  phis = np.load(f'{model_name}_{explainer_name}.npy')\n",
    "  phis = tf.cast(phis, tf.float32)[:,:,:,None]\n",
    "\n",
    "  score = robustness_sr(metric_model, X_test[:l], phis[:l], Y_test[:l], \n",
    "                        start_epsilon = 5e-3, tolerance = 1e-4, max_steps = 25,\n",
    "                        iterations = 50)\n",
    "\n",
    "  table.append((metric_name, model_name, explainer_name, score))\n",
    "  print(metric_name, explainer_name, score)\n",
    "\n",
    "np.save(f'results_{model_name}_{metric_name}', table)\n",
    "print('\\n\\n')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "L6JEiFhxgpVx"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "8YsIgogd2GMi"
   },
   "outputs": [],
   "source": [
    "np.save(f'results_{model_name}_{metric_name}', table)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "VstSvGlyL8PQ"
   },
   "outputs": [],
   "source": [
    "!cp results_* \"/content/drive/MyDrive/HKR XAI/results\""
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "G7WXaleiOz5V"
   },
   "source": [
    "# (2.bis) MuFidelity re-run"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 33788,
     "status": "ok",
     "timestamp": 1652363117745,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "gx-9p2ZhPAaf"
   },
   "outputs": [],
   "source": [
    "!cp -r \"/content/drive/MyDrive/HKR XAI/data\" ./"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 231,
     "status": "ok",
     "timestamp": 1652368344918,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "99O8n9RGO8O8"
   },
   "outputs": [],
   "source": [
    "X_test, Y_test = np.load('data/X_test_robust.npy'), np.load('data/Y_test_robust.npy')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4,
     "status": "ok",
     "timestamp": 1652368345623,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "sHxrqwSBQ9M_",
    "outputId": "de7df1da-0f7a-41da-835c-a1d4a8976d46"
   },
   "outputs": [],
   "source": [
    "explainers_names = [p for p in os.listdir('data') if 'results' not in p and 'model' in p]\n",
    "explainers_names = [p for p in explainers_names if model_name in p]\n",
    "explainers_names = [p.split('_')[-1].split('.npy')[0] for p in explainers_names]\n",
    "explainers_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4,
     "status": "ok",
     "timestamp": 1652349719737,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "MMeLkvUBRyoE",
    "outputId": "8f2286ea-20b2-42a1-84f5-a81b62f21780"
   },
   "outputs": [],
   "source": [
    "phis.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 217902,
     "status": "ok",
     "timestamp": 1652350556931,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "fOg8SAMfO3Qd",
    "outputId": "e13d4521-24ce-41c6-b850-2da61fda6bab"
   },
   "outputs": [],
   "source": [
    "from xplique.metrics import MuFidelity, Deletion, Insertion\n",
    "\n",
    "l = 1000\n",
    "batch_size  = 128\n",
    "\n",
    "x_max, x_min = X_test.max(), X_test.min()\n",
    "baseline_zero    = 0.0\n",
    "baseline_uniform = lambda x: np.random.uniform(size=x.shape) * (x_max-x_min) - x_min \n",
    "\n",
    "for grid_size in [20]:\n",
    "\n",
    "  metric = MuFidelity(binary_model, X_test[:l], Y_test[:l], batch_size = batch_size, grid_size = grid_size, nb_samples = 200, baseline_mode = baseline_zero)\n",
    "  metric_name = metric.__class__.__name__\n",
    "\n",
    "  table = []\n",
    "  \n",
    "  for explainer_name in explainers_names:\n",
    "    #explainer_name = explainer.__class__.__name__ \n",
    "    phis = np.load(f'data/{model_name}_{explainer_name}.npy')[:l]\n",
    "    phis = tf.cast(phis, tf.float32)[:,:,:,None]\n",
    "\n",
    "    score = metric(phis)\n",
    "    table.append((metric_name, model_name, explainer_name, score))\n",
    "    print(metric_name, explainer_name, score)\n",
    "  \n",
    "  np.save(f'results_{model_name}_{metric_name}_zero_{grid_size}', table)\n",
    "  print('done for ', grid_size)\n",
    "  print('\\n\\n')\n",
    "    \n"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "X2YHKZQEyYzU"
   },
   "source": [
    "# Saliency / SmoothGrad"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 3,
     "status": "ok",
     "timestamp": 1652351135749,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "aT6SVmgyycK_"
   },
   "outputs": [],
   "source": [
    "l = 200\n",
    "sa_phis = np.load(f'data/{model_name}_Saliency.npy')[:l]\n",
    "sa_phis = tf.cast(sa_phis, tf.float32)[:,:,:]\n",
    "\n",
    "sg_phis = np.load(f'data/{model_name}_SmoothGrad.npy')[:l]\n",
    "sg_phis = tf.cast(sg_phis, tf.float32)[:,:,:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4,
     "status": "ok",
     "timestamp": 1652351123069,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "j_dp3wQvyzeV",
    "outputId": "0b13c01b-2271-45b0-cfd1-29769520840d"
   },
   "outputs": [],
   "source": [
    "sa_phis.shape, sg_phis.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 369,
     "output_embedded_package_id": "1qyHujV9k14PfjUcHaBsSVQ7IkEW0OY0I"
    },
    "executionInfo": {
     "elapsed": 13195,
     "status": "ok",
     "timestamp": 1652351287909,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "dK-fTxrZy1Y8",
    "outputId": "19678425-b9a8-4f6f-90c0-46d389bb46d2"
   },
   "outputs": [],
   "source": [
    "set_size(20, 5)\n",
    "\n",
    "j = 10\n",
    "\n",
    "for i in range(5):\n",
    "  plt.subplot(2, 5, i+1)\n",
    "  show(X_test[i+j])\n",
    "  show(sa_phis[i+j], cmap='jet', alpha=0.4, p=0.5)\n",
    "  plt.subplot(2, 5, 5+i+1)\n",
    "  show(X_test[i+j])\n",
    "  show(sg_phis[i+j], cmap='jet', alpha=0.4, p=0.5)\n",
    "\n",
    "plt.tight_layout()\n",
    "plt.savefig('sa_vs_sg_non_robust.png', dpi=300)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 13782,
     "status": "ok",
     "timestamp": 1652352089432,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "OCkkc6ko26Td",
    "outputId": "3838c500-2cc7-4d43-8564-9240eaaa0835"
   },
   "outputs": [],
   "source": [
    "import scipy\n",
    "from scipy.stats import spearmanr\n",
    "\n",
    "l = 1000\n",
    "sa_phis = np.load(f'data/{model_name}_Saliency.npy')\n",
    "sa_phis = tf.cast(sa_phis, tf.float32).numpy()\n",
    "\n",
    "sg_phis = np.load(f'data/{model_name}_SmoothGrad.npy')\n",
    "sg_phis = tf.cast(sg_phis, tf.float32).numpy()\n",
    "\n",
    "spearman_dist = []\n",
    "l2_dist = []\n",
    "\n",
    "for h1, h2 in zip(sg_phis, sa_phis):\n",
    "  spearman_dist.append(spearmanr(h1.flatten(), h2.flatten())[0])\n",
    "  l2_dist.append(np.mean(np.sqrt(np.square(h1 - h2))))\n",
    "\n",
    "np.save('sa_sg_spearman_non_robust.npy', np.array(spearman_dist))\n",
    "np.save('sa_sg_l2_non_robust.npy', np.array(l2_dist))\n",
    "\n",
    "print('mean spearman', np.mean(spearman_dist), \"Mean l2\", np.mean(l2_dist))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "oPMogEZp4AjH"
   },
   "outputs": [],
   "source": []
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "HLTZfq0d3Pci"
   },
   "source": [
    "# Kolmogorov estimation\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4360,
     "status": "ok",
     "timestamp": 1652352462912,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "RyJgerlJ3Rd3",
    "outputId": "56e3ebcc-68be-4068-cbde-c52b3b335189"
   },
   "outputs": [],
   "source": [
    "import cv2\n",
    "\n",
    "sizes = []\n",
    "\n",
    "sa_phis = np.load(f'data/{model_name}_Saliency.npy')\n",
    "\n",
    "for phi in sa_phis:\n",
    "  phi -= phi.min()\n",
    "  phi /= phi.max()\n",
    "  phi *= 255.0\n",
    "  phi = np.array(phi).astype(np.uint8)\n",
    "\n",
    "  cv2.imwrite('img.jpg', phi)\n",
    "  sz = os.path.getsize(\"img.jpg\")\n",
    "\n",
    "  sizes.append(sz)\n",
    "\n",
    "np.save('robust_saliency_jpg_size.npy', sizes)\n",
    "print('mean bytes size', np.mean(sizes), \"std\", np.std(sizes))\n",
    "print('mean kilo-bytes', np.mean(sizes) / 1_000, \"std\", np.std(sizes) / 1_000)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "JLCZFrPHgdVd",
    "outputId": "f34fa76f-174e-4cf5-a98a-7493aadc6b72"
   },
   "outputs": [],
   "source": [
    "from xplique.metrics import MuFidelity, Deletion, Insertion\n",
    "\n",
    "l = 1000\n",
    "batch_size  = 128\n",
    "\n",
    "x_max, x_min = X_test.max(), X_test.min()\n",
    "baseline_zero    = 0.0\n",
    "baseline_uniform = lambda x: np.random.uniform(size=x.shape) * (x_max-x_min) - x_min \n",
    "\n",
    "grid_size = 20\n",
    "\n",
    "metric = MuFidelity(binary_model, X_test[:l], Y_test[:l], batch_size = batch_size, grid_size = grid_size, nb_samples = 250, baseline_mode = baseline_uniform)\n",
    "metric_name = metric.__class__.__name__\n",
    "\n",
    "table = []\n",
    "\n",
    "for explainer_name in explainers_names:\n",
    "  #explainer_name = explainer.__class__.__name__ \n",
    "  phis = np.load(f'data/{model_name}_{explainer_name}.npy')[:l]\n",
    "  phis = tf.cast(phis, tf.float32)[:,:,:,None]\n",
    "\n",
    "  score = metric(phis)\n",
    "  table.append((metric_name, model_name, explainer_name, score))\n",
    "  print(metric_name, explainer_name, score)\n",
    "\n",
    "\n",
    "filename = f'results_{model_name}_{metric_name}_uniform'\n",
    "np.save(filename, table)\n",
    "print('done for ', grid_size)\n",
    "print('\\n\\n')\n",
    "!cp {filename} \"/content/drive/MyDrive/HKR XAI/results\"\n",
    "    \n"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "c_5FiAHUU3vC"
   },
   "source": [
    "# (3) Stability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 81983,
     "status": "ok",
     "timestamp": 1652369091534,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "aG9FYbeVU5fl",
    "outputId": "4e7554b5-db22-4f3e-c5b8-2aa97ec08a0a"
   },
   "outputs": [],
   "source": [
    "from scipy.stats import spearmanr\n",
    "\n",
    "l = 500\n",
    "\n",
    "def spearman_dist(phi1, phi2):\n",
    "  if len(phi1.shape) == 3:\n",
    "    phi1 = np.mean(phi1, -1)\n",
    "    phi2 = np.mean(phi2, -1)\n",
    "  return 1.0 - np.abs(spearmanr(np.array(phi1).flatten(), np.array(phi2).flatten()))\n",
    "\n",
    "def l2_dist(phi1, phi2):\n",
    "  if len(phi1.shape) == 3:\n",
    "    phi1 = np.mean(phi1, -1)\n",
    "    phi2 = np.mean(phi2, -1)\n",
    "  return np.mean((phi1 - phi2)**2.0)\n",
    "\n",
    "metric = AverageStability(binary_model, X_test[:l], Y_test[:l], batch_size = 128, radius = 0.1, \n",
    "                          distance = spearman_dist, nb_samples = 10)\n",
    "\n",
    "results = []\n",
    "\n",
    "for explainer in [\n",
    "                  Saliency(binary_model),\n",
    "                  IntegratedGradients(binary_model, steps = 80),\n",
    "                  SmoothGrad(binary_model, nb_samples = 80)\n",
    "]:\n",
    "  explainer_name = explainer.__class__.__name__\n",
    "  \n",
    "  score = metric.evaluate(explainer)\n",
    "  results.append((explainer_name, score))\n",
    "  print(explainer_name, score)\n",
    "\n",
    "np.save('stability_spearman_non_robust.npy', results)\n",
    "\n",
    "from scipy.stats import spearmanr\n",
    "\n",
    "\n",
    "metric = AverageStability(binary_model, X_test[:l], Y_test[:l], batch_size = 128, radius = 0.1, \n",
    "                          distance = l2_dist, nb_samples = 10)\n",
    "\n",
    "results = []\n",
    "\n",
    "for explainer in [\n",
    "                  Saliency(binary_model),\n",
    "                  IntegratedGradients(binary_model, steps = 80),\n",
    "                  SmoothGrad(binary_model, nb_samples = 80)\n",
    "]:\n",
    "  explainer_name = explainer.__class__.__name__\n",
    "  \n",
    "  score = metric.evaluate(explainer)\n",
    "  results.append((explainer_name, score))\n",
    "  print(explainer_name, score)\n",
    "\n",
    "np.save('stability_l2_non_robust.npy', results)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "F2p8DuZT1SiN"
   },
   "outputs": [],
   "source": [
    "metric = AverageStability(binary_model, X_test[:l], Y_test[:l], batch_size = 128, radius = 0.1, \n",
    "                          distance = 'l2', nb_samples = 20)\n",
    "\n",
    "results = []\n",
    "\n",
    "for explainer in [\n",
    "                  Saliency(binary_model),\n",
    "                  IntegratedGradients(binary_model, steps = 10),\n",
    "                  SmoothGrad(binary_model, nb_samples = 10)\n",
    "]:\n",
    "  explainer_name = explainer.__class__.__name__\n",
    "  \n",
    "  score = metric.evaluate(explainer)\n",
    "  results.append((explainer_name, score))\n",
    "  print(explainer_name, score)\n",
    "\n",
    "np.save('stability_l2_non_robust.npy', results)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4,
     "status": "ok",
     "timestamp": 1652368359003,
     "user": {
      "displayName": "thomas fel",
      "userId": "05846348858113125044"
     },
     "user_tz": -120
    },
    "id": "TCfWIZBtU6AE",
    "outputId": "f637f4f6-85a1-4b5c-9c1b-5eb274f8c7df"
   },
   "outputs": [],
   "source": [
    "Y_test.shape"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {
    "id": "bVPzPNnWU6Jw"
   },
   "source": [
    "# (4) Kolmogorov Complexity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "b36AX9KdU8lc"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "t0lVdSZyU8_A"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "accelerator": "GPU",
  "colab": {
   "collapsed_sections": [],
   "machine_shape": "hm",
   "name": "001 (Non Robust) CelebA compute explanations.ipynb",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
