{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "a995c4f2",
   "metadata": {},
   "source": [
    "# AUC"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "05adfe85",
   "metadata": {},
   "outputs": [],
   "source": [
    "import my_datasets as md\n",
    "import my_models as mm\n",
    "import my_uncertainty as mu\n",
    "import torch\n",
    "from torch import nn\n",
    "import scipy.stats as stats\n",
    "import numpy as np\n",
    "import pickle\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "from sklearn.metrics import roc_auc_score\n",
    "\n",
    "with open('results.pkl', 'rb') as f: \n",
    "    r = pickle.load(f)\n",
    "\n",
    "plt.rcParams[\"figure.figsize\"] = [20, 4]\n",
    "UNCER_QUANT = [mu.BLOODQuant().name+\"_mean\", mu.BLOODQuant().name+\"_last\", mu.LeastConfidentQuant().name, mu.EntropyQuant().name, mu.MCDropoutQuant().name, mu.GradQuant().name, mu.EnsambleQuant().name, mu.TemperatureScalingQuant().name, mu.MahalanobisQuant().name, \"repr_change_mean\", \"repr_change_last\"]\n",
    "MODELS = [\"RoBERTa\"] \n",
    "NUM_SEEDS = 5\n",
    "\n",
    "def variation(uncer, mode=\"_last\"):\n",
    "    if mode == \"_last\":\n",
    "        return uncer[-1,:]\n",
    "    elif mode == \"_mean\":\n",
    "        return uncer.mean(axis=0)\n",
    "    \n",
    "for data_name, run in r.items():\n",
    "    for model_name in MODELS:\n",
    "        for uncer_name in UNCER_QUANT:\n",
    "            BIO = False\n",
    "            for seed in range(NUM_SEEDS):\n",
    "                if (uncer_name.startswith(mu.BLOODQuant().name) or uncer_name.startswith(\"repr_change\")) and not BIO:\n",
    "                    BIO = True\n",
    "                    mode = uncer_name[-5:]\n",
    "                    uncer_name = uncer_name[:-5]\n",
    "                elif not (uncer_name.startswith(mu.BLOODQuant().name) or uncer_name.startswith(\"repr_change\")):\n",
    "                    mode = \"\"\n",
    "                uncer_id = run[model_name][\"fine-tuned\"][seed][uncer_name][\"id\"]\n",
    "                uncer_id = variation(uncer_id, mode=mode) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_id\n",
    "                uncer_id = -uncer_id if uncer_name == \"repr_change\" else uncer_id\n",
    "                uncer_ood = run[model_name][\"fine-tuned\"][seed][uncer_name][\"ood\"]\n",
    "                uncer_ood = variation(uncer_ood, mode=mode) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_ood\n",
    "                uncer_ood = -uncer_ood if uncer_name == \"repr_change\" else uncer_ood\n",
    "                DATA = [0 for _ in range(len(uncer_id))] + [1 for _ in range(len(uncer_ood))]\n",
    "                aucs.append(roc_auc_score(DATA, uncer_id.tolist()+uncer_ood.tolist()))\n",
    "            fig.show()\n",
    "            aucs = np.array(aucs)\n",
    "            print(f\"{data_name} - {model_name} [{uncer_name+mode}]: AUC = {round(aucs.mean()*100, 2):.2f} $\\pm$ {round(aucs.std()*100, 2):.2f}\")\n",
    "        print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "40da49d8",
   "metadata": {},
   "outputs": [],
   "source": [
    "import my_datasets as md\n",
    "import my_models as mm\n",
    "import my_uncertainty as mu\n",
    "import torch\n",
    "from torch import nn\n",
    "import scipy.stats as stats\n",
    "import numpy as np\n",
    "import pickle\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "from sklearn.metrics import roc_curve, roc_auc_score\n",
    "\n",
    "with open('results-shifted-sst.pkl', 'rb') as f: \n",
    "    r = pickle.load(f)\n",
    "    \n",
    "plt.rcParams[\"figure.figsize\"] = [20, 4]\n",
    "UNCER_QUANT = [mu.BLOODQuant().name+\"_mean\", mu.BLOODQuant().name+\"_last\", mu.LeastConfidentQuant().name, mu.EntropyQuant().name, mu.MCDropoutQuant().name, mu.GradQuant().name, mu.EnsambleQuant().name, mu.TemperatureScalingQuant().name, mu.MahalanobisQuant().name, \"repr_change_mean\", \"repr_change_last\"]\n",
    "MODELS = [\"RoBERTa\", \"ELECTRA\"] \n",
    "NUM_SEEDS = 5\n",
    "\n",
    "def variation(uncer, mode=\"last\"):\n",
    "    if mode == \"last\":\n",
    "        return uncer[-1,:]\n",
    "    elif mode == \"mean\":\n",
    "        return uncer.mean(axis=0)\n",
    "    \n",
    "for data_name, run in r.items():\n",
    "    for model_name in MODELS:\n",
    "        for uncer_name in UNCER_QUANT:\n",
    "            for seed in range(NUM_SEEDS):               \n",
    "                uncer_id = run[model_name][\"fine-tuned\"][seed][uncer_name][\"id\"]\n",
    "                uncer_id = variation(uncer_id) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_id\n",
    "                uncer_id = -uncer_id if uncer_name == \"repr_change\" else uncer_id\n",
    "                uncer_ood = run[model_name][\"fine-tuned\"][seed][uncer_name][\"shifted\"]\n",
    "                uncer_ood = variation(uncer_ood) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_ood\n",
    "                uncer_ood = -uncer_ood if uncer_name == \"repr_change\" else uncer_ood\n",
    "                \n",
    "                DATA = [0 for _ in range(len(uncer_id))] + [1 for _ in range(len(uncer_ood))]\n",
    "                fpr, tpr, _ = roc_curve(DATA, uncer_id.tolist()+uncer_ood.tolist())\n",
    "                aucs.append(roc_auc_score(DATA, uncer_id.tolist()+uncer_ood.tolist()))\n",
    "            aucs = np.array(aucs)\n",
    "            print(f\"{data_name} - {model_name} [{uncer_name}]: AUC = {round(aucs.mean()*100, 2):.2f} $\\pm$ {round(aucs.std()*100, 2):.2f}\"))\n",
    "        print()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "93f6c47e",
   "metadata": {},
   "source": [
    "# AUPR"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d61939b2",
   "metadata": {},
   "outputs": [],
   "source": [
    "import my_datasets as md\n",
    "import my_models as mm\n",
    "import my_uncertainty as mu\n",
    "import torch\n",
    "from torch import nn\n",
    "import scipy.stats as stats\n",
    "import numpy as np\n",
    "import pickle\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "from sklearn.metrics import auc, precision_recall_curve\n",
    "\n",
    "with open('results.pkl', 'rb') as f: \n",
    "    r = pickle.load(f)\n",
    "    \n",
    "plt.rcParams[\"figure.figsize\"] = [20, 4]\n",
    "UNCER_QUANT = [mu.BLOODQuant().name+\"_mean\", mu.BLOODQuant().name+\"_last\", mu.LeastConfidentQuant().name, mu.EntropyQuant().name, mu.MCDropoutQuant().name, mu.GradQuant().name, mu.EnsambleQuant().name, mu.TemperatureScalingQuant().name, mu.MahalanobisQuant().name]\n",
    "MODELS = [\"ELECTRA\"] \n",
    "NUM_SEEDS = 5\n",
    "\n",
    "def variation(uncer, mode=\"_last\"):\n",
    "    if mode == \"_last\":\n",
    "        return uncer[-1,:]\n",
    "    elif mode == \"_mean\":\n",
    "        return uncer.mean(axis=0)\n",
    "    \n",
    "for data_name, run in r.items():\n",
    "    for model_name in MODELS:\n",
    "        for uncer_name in UNCER_QUANT:\n",
    "            BIO = False\n",
    "            fig, axs = plt.subplots(1, NUM_SEEDS)\n",
    "            if NUM_SEEDS == 1:\n",
    "                axs = [axs]\n",
    "            aucs = []\n",
    "            for seed in range(NUM_SEEDS):\n",
    "                uncer_id = run[model_name][\"fine-tuned\"][seed][uncer_name][\"id\"]\n",
    "                uncer_id = variation(uncer_id, mode=mode) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_id\n",
    "                uncer_id = -uncer_id if uncer_name == \"repr_change\" else uncer_id\n",
    "                uncer_ood = run[model_name][\"fine-tuned\"][seed][uncer_name][\"ood\"]\n",
    "                uncer_ood = variation(uncer_ood, mode=mode) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_ood\n",
    "                uncer_ood = -uncer_ood if uncer_name == \"repr_change\" else uncer_ood\n",
    "                DATA = [1 for _ in range(len(uncer_id))] + [0 for _ in range(len(uncer_ood))]\n",
    "                uncer_id = -uncer_id\n",
    "                uncer_ood = -uncer_ood\n",
    "                precision, recall, _ = precision_recall_curve(DATA, uncer_id.tolist()+uncer_ood.tolist())\n",
    "                aucs.append(auc(recall, precision))\n",
    "            aucs = np.array(aucs)\n",
    "            print(f\"{data_name} - {model_name} [{uncer_name+mode}]: AUPR = {round(aucs.mean()*100, 2):.2f} $\\pm$ {round(aucs.std()*100, 2):.2f}\")\n",
    "        print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ca4998c5",
   "metadata": {},
   "outputs": [],
   "source": [
    "import my_datasets as md\n",
    "import my_models as mm\n",
    "import my_uncertainty as mu\n",
    "import torch\n",
    "from torch import nn\n",
    "import scipy.stats as stats\n",
    "import numpy as np\n",
    "import pickle\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "from sklearn.metrics import roc_curve, roc_auc_score\n",
    "\n",
    "with open('results-shifted-sst.pkl', 'rb') as f: \n",
    "    r = pickle.load(f)\n",
    "    \n",
    "plt.rcParams[\"figure.figsize\"] = [20, 4]\n",
    "UNCER_QUANT = [mu.BLOODQuant().name+\"_mean\", mu.BLOODQuant().name+\"_last\", mu.LeastConfidentQuant().name, mu.EntropyQuant().name, mu.MCDropoutQuant().name, mu.GradQuant().name, mu.EnsambleQuant().name, mu.TemperatureScalingQuant().name, mu.MahalanobisQuant().name]\n",
    "MODELS = [\"RoBERTa\", \"ELECTRA\"]\n",
    "NUM_SEEDS = 5\n",
    "\n",
    "def variation(uncer, mode=\"last\"):\n",
    "    if mode == \"last\":\n",
    "        return uncer[-1,:]\n",
    "    elif mode == \"mean\":\n",
    "        return uncer.mean(axis=0)\n",
    "    \n",
    "for data_name, run in r.items():\n",
    "    for model_name in MODELS:\n",
    "        for uncer_name in UNCER_QUANT:\n",
    "            if NUM_SEEDS == 1:\n",
    "                axs = [axs]\n",
    "            aucs = []\n",
    "            for seed in range(NUM_SEEDS):               \n",
    "                uncer_id = run[model_name][\"fine-tuned\"][seed][uncer_name][\"id\"]\n",
    "                uncer_id = variation(uncer_id) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_id\n",
    "                uncer_id = -uncer_id if uncer_name == \"repr_change\" else uncer_id\n",
    "                uncer_ood = run[model_name][\"fine-tuned\"][seed][uncer_name][\"shifted\"]\n",
    "                uncer_ood = variation(uncer_ood) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_ood\n",
    "                uncer_ood = -uncer_ood if uncer_name = \"repr_change\" else uncer_ood\n",
    "                \n",
    "                DATA = [1 for _ in range(len(uncer_id))] + [0 for _ in range(len(uncer_ood))]\n",
    "                uncer_id = -uncer_id\n",
    "                uncer_ood = -uncer_ood\n",
    "                precision, recall, _ = precision_recall_curve(DATA, uncer_id.tolist()+uncer_ood.tolist())\n",
    "                aucs.append(auc(recall, precision))\n",
    "            aucs = np.array(aucs)\n",
    "            print(f\"{data_name} - {model_name} [{uncer_name}]: AUPR = {round(aucs.mean()*100, 2):.2f} $\\pm$ {round(aucs.std()*100, 2):.2f}\")\n",
    "        print()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8aa9aaad",
   "metadata": {},
   "source": [
    "# FPR@95TPR"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "d69c01ec",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import torch\n",
    "\n",
    "def fpr95(uncers_id, uncers_ood):\n",
    "    th = np.percentile(uncers_id, 95)\n",
    "    if torch.is_tensor(uncers_ood):\n",
    "        uncers_ood = uncers_ood.cpu().detach().numpy()\n",
    "    return (uncers_ood < th).mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "427d9eb8",
   "metadata": {},
   "outputs": [],
   "source": [
    "import my_datasets as md\n",
    "import my_models as mm\n",
    "import my_uncertainty as mu\n",
    "import torch\n",
    "from torch import nn\n",
    "import scipy.stats as stats\n",
    "import numpy as np\n",
    "import pickle\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "from sklearn.metrics import roc_curve, roc_auc_score, auc, precision_recall_curve\n",
    "\n",
    "with open('results.pkl', 'rb') as f: \n",
    "    r = pickle.load(f)\n",
    "    \n",
    "plt.rcParams[\"figure.figsize\"] = [20, 4]\n",
    "UNCER_QUANT = [mu.BLOODQuant().name+\"_mean\", mu.BLOODQuant().name+\"_last\", mu.LeastConfidentQuant().name, mu.EntropyQuant().name, mu.MCDropoutQuant().name, mu.GradQuant().name, mu.EnsambleQuant().name, mu.TemperatureScalingQuant().name, mu.MahalanobisQuant().name]\n",
    "MODELS = [\"ELECTRA\"] \n",
    "NUM_SEEDS = 5\n",
    "\n",
    "def variation(uncer, mode=\"_last\"):\n",
    "    if mode == \"_last\":\n",
    "        return uncer[-1,:]\n",
    "    elif mode == \"_mean\":\n",
    "        return uncer.mean(axis=0)\n",
    "    \n",
    "for data_name, run in r.items():\n",
    "    for model_name in MODELS:\n",
    "        for uncer_name in UNCER_QUANT:\n",
    "            BIO = False\n",
    "            fig, axs = plt.subplots(1, NUM_SEEDS)\n",
    "            if NUM_SEEDS == 1:\n",
    "                axs = [axs]\n",
    "            aucs = []\n",
    "            for seed in range(NUM_SEEDS):\n",
    "                uncer_id = run[model_name][\"fine-tuned\"][seed][uncer_name][\"id\"]\n",
    "                uncer_id = variation(uncer_id, mode=mode) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_id\n",
    "                uncer_id = -uncer_id if uncer_name == \"repr_change\" else uncer_id\n",
    "                uncer_ood = run[model_name][\"fine-tuned\"][seed][uncer_name][\"ood\"]\n",
    "                uncer_ood = variation(uncer_ood, mode=mode) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_ood\n",
    "                uncer_ood = -uncer_ood if uncer_name == \"repr_change\" else uncer_ood\n",
    "                aucs.append(fpr95(uncer_id, uncer_ood))\n",
    "            aucs = np.array(aucs)\n",
    "            print(f\"{data_name} - {model_name} [{uncer_name+mode}]: FPR = {round(aucs.mean()*100, 2):.2f} $\\pm$ {round(aucs.std()*100, 2):.2f}\")\n",
    "        print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7dec5035",
   "metadata": {},
   "outputs": [],
   "source": [
    "import my_datasets as md\n",
    "import my_models as mm\n",
    "import my_uncertainty as mu\n",
    "import torch\n",
    "from torch import nn\n",
    "import matplotlib.pyplot as plt\n",
    "import scipy.stats as stats\n",
    "import numpy as np\n",
    "import pickle\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "from sklearn.metrics import roc_curve, roc_auc_score\n",
    "\n",
    "with open('results-shifted-sst.pkl', 'rb') as f: \n",
    "    r = pickle.load(f)\n",
    "    \n",
    "plt.rcParams[\"figure.figsize\"] = [20, 4]\n",
    "UNCER_QUANT = [mu.BLOODQuant().name+\"_mean\", mu.BLOODQuant().name+\"_last\", mu.BLOODQuant().name, mu.EntropyQuant().name, mu.MCDropoutQuant().name, mu.GradQuant().name, mu.EnsambleQuant().name, mu.TemperatureScalingQuant().name, mu.MahalanobisQuant().name]\n",
    "MODELS = [\"RoBERTa\", \"ELECTRA\"]\n",
    "NUM_SEEDS = 5\n",
    "\n",
    "def variation(uncer, mode=\"last\"):\n",
    "    if mode == \"last\":\n",
    "        return uncer[-1,:]\n",
    "    elif mode == \"mean\":\n",
    "        return uncer.mean(axis=0)\n",
    "    \n",
    "for data_name, run in r.items():\n",
    "    for model_name in MODELS:\n",
    "        for uncer_name in UNCER_QUANT:\n",
    "            if NUM_SEEDS == 1:\n",
    "                axs = [axs]\n",
    "            aucs = []\n",
    "            for seed in range(NUM_SEEDS):               \n",
    "                uncer_id = run[model_name][\"fine-tuned\"][seed][uncer_name][\"id\"]\n",
    "                uncer_id = variation(uncer_id) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_id\n",
    "                uncer_id = -uncer_id if uncer_name == \"repr_change\" else uncer_id\n",
    "                uncer_ood = run[model_name][\"fine-tuned\"][seed][uncer_name][\"shifted\"]\n",
    "                uncer_ood = variation(uncer_ood) if uncer_name in [\"BLOOD\", \"repr_change\"] else uncer_ood\n",
    "                uncer_ood = -uncer_ood if uncer_name == \"repr_change\" else uncer_ood\n",
    "                \n",
    "                aucs.append(fpr95(uncer_id, uncer_ood))\n",
    "                \n",
    "            aucs = np.array(aucs)\n",
    "            print(f\"{data_name} - {model_name} [{uncer_name}]: AUPR = {round(aucs.mean()*100, 2):.2f} $\\pm$ {round(aucs.std()*100, 2):.2f}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "01e042b6",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
