{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1082,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1906,
     "status": "ok",
     "timestamp": 1694139338627,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Au3Fcvf9ONNZ",
    "outputId": "a87b12f8-d28f-4db6-e61c-610156ff8ac8"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Drive already mounted at /content/gdrive; to attempt to forcibly remount, call drive.mount(\"/content/gdrive\", force_remount=True).\n"
     ]
    }
   ],
   "source": [
    "from google.colab import drive\n",
    "drive.mount('/content/gdrive')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1083,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5436,
     "status": "ok",
     "timestamp": 1694139344061,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "cOzitmuHEa-L",
    "outputId": "aadfd93a-4807-4884-a9cf-420c97765ef2"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: PIMS in /usr/local/lib/python3.10/dist-packages (0.6.1)\n",
      "Requirement already satisfied: imageio in /usr/local/lib/python3.10/dist-packages (from PIMS) (2.31.1)\n",
      "Requirement already satisfied: numpy>=1.19 in /usr/local/lib/python3.10/dist-packages (from PIMS) (1.23.5)\n",
      "Requirement already satisfied: slicerator>=0.9.8 in /usr/local/lib/python3.10/dist-packages (from PIMS) (1.1.0)\n",
      "Requirement already satisfied: pillow>=8.3.2 in /usr/local/lib/python3.10/dist-packages (from imageio->PIMS) (9.4.0)\n"
     ]
    }
   ],
   "source": [
    "pip install PIMS"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1085,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5332,
     "status": "ok",
     "timestamp": 1694139355796,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "9WyZRdVSFsvW",
    "outputId": "9f4e5c85-fd85-470a-b3f5-a49b3c0eccd6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: fastcluster in /usr/local/lib/python3.10/dist-packages (1.2.6)\n",
      "Requirement already satisfied: numpy>=1.9 in /usr/local/lib/python3.10/dist-packages (from fastcluster) (1.23.5)\n"
     ]
    }
   ],
   "source": [
    "pip install fastcluster"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1086,
   "metadata": {
    "executionInfo": {
     "elapsed": 7,
     "status": "ok",
     "timestamp": 1694139355797,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "UFN8FbHYOWnl"
   },
   "outputs": [],
   "source": [
    "import torch\n",
    "import numpy as np\n",
    "from torchvision import datasets\n",
    "import torchvision.transforms as transforms\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import torchvision\n",
    "import torch\n",
    "from torchvision import transforms\n",
    "\n",
    "plt.rcParams['axes.facecolor'] = 'white'\n",
    "plt.rcParams['figure.figsize'] = 9, 6"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1087,
   "metadata": {
    "executionInfo": {
     "elapsed": 6,
     "status": "ok",
     "timestamp": 1694139355797,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "CKgWca6rEXRj"
   },
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "\n",
    "# importing relevant libraries\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import scipy as sp\n",
    "import matplotlib.pyplot as plt\n",
    "import sklearn\n",
    "from sklearn.ensemble import RandomForestClassifier, ExtraTreesClassifier\n",
    "from sklearn.preprocessing import OneHotEncoder, StandardScaler\n",
    "from sklearn.model_selection import cross_val_predict, StratifiedKFold\n",
    "from sklearn.metrics import roc_auc_score, average_precision_score, precision_recall_curve, auc#plot_precision_recall_curve\n",
    "from sklearn.datasets import make_classification\n",
    "from sklearn.preprocessing import MinMaxScaler\n",
    "from tqdm import tqdm\n",
    "from umap import UMAP\n",
    "from pynndescent import NNDescent\n",
    "from fastcluster import single\n",
    "from scipy.cluster.hierarchy import cut_tree, fcluster, dendrogram\n",
    "from scipy.spatial.distance import squareform\n",
    "from sklearn.tree import DecisionTreeClassifier, ExtraTreeClassifier\n",
    "from pims import ImageSequence\n",
    "from PIL import Image\n",
    "from scipy.spatial.distance import hamming\n",
    "import warnings\n",
    "warnings.filterwarnings('ignore')\n",
    "\n",
    "# turning off automatic plot showing, and setting style\n",
    "plt.style.use('bmh')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 988,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 14,
     "status": "ok",
     "timestamp": 1694122502401,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "8iNq7_xZ6WJK",
    "outputId": "197dcf3a-52d1-4d42-ac43-e03c5e653d29"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cpu\n"
     ]
    }
   ],
   "source": [
    "if torch.cuda.is_available():\n",
    "    device = torch.device('cuda')\n",
    "else:\n",
    "    device = torch.device('cpu')\n",
    "\n",
    "print(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 989,
   "metadata": {
    "executionInfo": {
     "elapsed": 6,
     "status": "ok",
     "timestamp": 1694122502401,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "HrjCzoe8OWqH"
   },
   "outputs": [],
   "source": [
    "# define the NN architecture\n",
    "class ConvAutoencoder(nn.Module):\n",
    "    def __init__(self):\n",
    "        super(ConvAutoencoder, self).__init__()\n",
    "        ## encoder layers ##\n",
    "        # conv layer (depth from 1 --> 16), 3x3 kernels\n",
    "        self.conv1 = nn.Conv2d(1, 16, 3, padding=1)\n",
    "        # conv layer (depth from 16 --> 4), 3x3 kernels\n",
    "        self.conv2 = nn.Conv2d(16, 4, 3, padding=1)\n",
    "        # pooling layer to reduce x-y dims by two; kernel and stride of 2\n",
    "        self.pool = nn.MaxPool2d(2, 2)\n",
    "\n",
    "        ## decoder layers ##\n",
    "        ## a kernel of 2 and a stride of 2 will increase the spatial dims by 2\n",
    "        self.t_conv1 = nn.ConvTranspose2d(4, 16, 2, stride=2)\n",
    "        self.t_conv2 = nn.ConvTranspose2d(16, 1, 2, stride=2)\n",
    "\n",
    "\n",
    "    def forward(self, x):\n",
    "        ## encode ##\n",
    "        # add hidden layers with relu activation function\n",
    "        # and maxpooling after\n",
    "        x = F.relu(self.conv1(x))\n",
    "        x = self.pool(x)\n",
    "        # add second hidden layer\n",
    "        x = F.relu(self.conv2(x))\n",
    "        x = self.pool(x)  # compressed representation\n",
    "\n",
    "        ## decode ##\n",
    "        # add transpose conv layers, with relu activation function\n",
    "        x = F.relu(self.t_conv1(x))\n",
    "        # output layer (with sigmoid for scaling from 0 to 1)\n",
    "        x = F.sigmoid(self.t_conv2(x))\n",
    "\n",
    "        return x\n",
    "\n",
    "    def forward_encoder(self, x):\n",
    "        x = F.relu(self.conv1(x))\n",
    "        x = self.pool(x)\n",
    "        # add second hidden layer\n",
    "        x = F.relu(self.conv2(x))\n",
    "        x = self.pool(x)  # compressed representation\n",
    "\n",
    "        return x\n",
    "\n",
    "\n",
    "# Training function\n",
    "def train(model, train_loader, criterion, optimizer, num_epochs=10, online = False):\n",
    "    model.train()\n",
    "    for epoch in range(num_epochs):\n",
    "        running_loss = 0.0\n",
    "        if not online:\n",
    "            for images in train_loader:\n",
    "                noisy_images = images #+ torch.randn(images.size()) * 0.1  # Adding Gaussian noise\n",
    "                noisy_images = torchvision.transforms.Grayscale(num_output_channels=1)(noisy_images)\n",
    "                optimizer.zero_grad()\n",
    "                outputs = model(noisy_images)\n",
    "                loss = criterion(outputs, images)\n",
    "                loss.backward()\n",
    "                optimizer.step()\n",
    "                running_loss += loss.item()\n",
    "        else:\n",
    "            for images, _ in train_loader:\n",
    "                noisy_images = images #+ torch.randn(images.size()) * 0.1  # Adding Gaussian noise\n",
    "                noisy_images = torchvision.transforms.Grayscale(num_output_channels=1)(noisy_images)\n",
    "                optimizer.zero_grad()\n",
    "                outputs = model(noisy_images)\n",
    "                loss = criterion(outputs, images)\n",
    "                loss.backward()\n",
    "                optimizer.step()\n",
    "                running_loss += loss.item()\n",
    "        print(f\"Epoch [{epoch + 1}/{num_epochs}], Loss: {running_loss / len(train_loader)}\")\n",
    "\n",
    "# Data preprocessing\n",
    "transform = transforms.Compose([\n",
    "    transforms.ToTensor(),\n",
    "])\n",
    "\n",
    "# Initialize the model, criterion, and optimizer\n",
    "model = ConvAutoencoder()\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = torch.optim.Adam(model.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 990,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 591166,
     "status": "ok",
     "timestamp": 1694123093561,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Om9z7Bi4O-sW",
    "outputId": "16725f15-f047-48a1-c7a8-21a10e35efaf"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch [1/30], Loss: 0.03456441803114501\n",
      "Epoch [2/30], Loss: 0.015335978169653462\n",
      "Epoch [3/30], Loss: 0.01431086510499276\n",
      "Epoch [4/30], Loss: 0.01361127900205918\n",
      "Epoch [5/30], Loss: 0.013123237304508623\n",
      "Epoch [6/30], Loss: 0.012749999074507624\n",
      "Epoch [7/30], Loss: 0.012421703745505766\n",
      "Epoch [8/30], Loss: 0.012119799774926481\n",
      "Epoch [9/30], Loss: 0.011838643721290934\n",
      "Epoch [10/30], Loss: 0.01165153897766556\n",
      "Epoch [11/30], Loss: 0.011503737467501971\n",
      "Epoch [12/30], Loss: 0.01137899024896562\n",
      "Epoch [13/30], Loss: 0.011199908384652154\n",
      "Epoch [14/30], Loss: 0.01105614403274649\n",
      "Epoch [15/30], Loss: 0.010939428055567591\n",
      "Epoch [16/30], Loss: 0.010819886036630252\n",
      "Epoch [17/30], Loss: 0.010716436698889808\n",
      "Epoch [18/30], Loss: 0.010621629811243526\n",
      "Epoch [19/30], Loss: 0.01052907568865271\n",
      "Epoch [20/30], Loss: 0.010441198085210344\n",
      "Epoch [21/30], Loss: 0.010371393659142162\n",
      "Epoch [22/30], Loss: 0.010319650055034392\n",
      "Epoch [23/30], Loss: 0.010271423975867567\n",
      "Epoch [24/30], Loss: 0.010224905479619942\n",
      "Epoch [25/30], Loss: 0.010190062296352408\n",
      "Epoch [26/30], Loss: 0.01015135308584647\n",
      "Epoch [27/30], Loss: 0.010117423250528572\n",
      "Epoch [28/30], Loss: 0.010087443005317437\n",
      "Epoch [29/30], Loss: 0.010053345408322397\n",
      "Epoch [30/30], Loss: 0.010026184544126108\n"
     ]
    }
   ],
   "source": [
    "# Load CIFAR-10 data\n",
    "train_dataset = torchvision.datasets.MNIST(root=\".MNIST/train\", train=True, transform=transform, download=True)\n",
    "train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=64, shuffle=True, num_workers=4)\n",
    "\n",
    "# Training the model\n",
    "train(model, train_loader, criterion, optimizer, num_epochs=30, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 991,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 26874,
     "status": "ok",
     "timestamp": 1694123120414,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "bh3Zu2QWO-uq",
    "outputId": "b0ab4a7f-2a9b-4796-9530-3d102dc798f6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'torchvision.datasets.mnist.MNIST'>\n",
      "[9 3 6 ... 3 1 0]\n",
      "(60000, 1, 28, 28)\n",
      "(60000, 4, 7, 7)\n",
      "(60000,)\n"
     ]
    }
   ],
   "source": [
    "train_dataset = torchvision.datasets.MNIST(root=\".MNIST/train\", train=True, transform=transform, download=True)\n",
    "train_loader = torch.utils.data.DataLoader(train_dataset, batch_size = 60000, shuffle=True)\n",
    "\n",
    "print(type(train_dataset))\n",
    "\n",
    "for batch in train_loader:\n",
    "    img, labels = batch\n",
    "    #img = img.reshape(-1, 28*28)\n",
    "\n",
    "    # Generating output\n",
    "    out = model.forward(img)\n",
    "    latent_train = model.forward_encoder(img)\n",
    "\n",
    "X_train = img.detach().numpy()\n",
    "latent_train = latent_train.detach().numpy()\n",
    "y = labels.detach().numpy()\n",
    "print(y)\n",
    "print(X_train.shape)\n",
    "print(latent_train.shape)\n",
    "print(y.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 992,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1076,
     "status": "ok",
     "timestamp": 1694123121462,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ssO_Le6NP6HZ",
    "outputId": "dce48624-169c-41df-8c00-2dbb8d62da83"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(60000, 784)\n",
      "(60000, 196)\n",
      "0.0018747908346718198\n",
      "0.0021766304922793598\n"
     ]
    }
   ],
   "source": [
    "X_train = X_train.reshape(-1,28*28)\n",
    "latent_train = latent_train.reshape(-1,4*7*7)\n",
    "print(X_train.shape)\n",
    "print(latent_train.shape)\n",
    "print(np.mean(np.cov(X_train.T)))\n",
    "print(np.mean(np.cov(latent_train.T)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 995,
   "metadata": {
    "executionInfo": {
     "elapsed": 5,
     "status": "ok",
     "timestamp": 1694123227390,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "fw90altp9HQr"
   },
   "outputs": [],
   "source": [
    "# y = y[:2400]\n",
    "# latent_train = latent_train[:2400,:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 996,
   "metadata": {
    "executionInfo": {
     "elapsed": 6,
     "status": "ok",
     "timestamp": 1694123227391,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "W_x-D1GZD-XN"
   },
   "outputs": [],
   "source": [
    "# np.random.shuffle(y)\n",
    "# print(y)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "k3hp5R2cQCD9"
   },
   "source": [
    "# Tree Model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 997,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 39070,
     "status": "ok",
     "timestamp": 1694123266456,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "R3tnvjyuQKpq",
    "outputId": "1112978d-1748-4f3f-c8e9-04a94a2742a7"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Area under the ROC Curve: 0.9923137003638487\n"
     ]
    }
   ],
   "source": [
    "et = ExtraTreesClassifier(n_estimators=500, min_samples_leaf=100,\n",
    "                          max_features='sqrt', bootstrap=True, class_weight='balanced', n_jobs=-1)\n",
    "\n",
    "# et = RandomForestClassifier(n_estimators=500, min_samples_leaf=100,\n",
    "#                           max_features='sqrt', bootstrap=True, class_weight='balanced', n_jobs=-1)\n",
    "\n",
    "# validation instance\n",
    "skf = StratifiedKFold(n_splits=5, shuffle=True)\n",
    "\n",
    "# getting the model validation predictions\n",
    "preds = cross_val_predict(et, latent_train, y, cv=skf, method='predict_proba')\n",
    "\n",
    "# evaluating the model\n",
    "print('Area under the ROC Curve:', roc_auc_score(y, preds, multi_class='ovo'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 998,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 92
    },
    "executionInfo": {
     "elapsed": 9442,
     "status": "ok",
     "timestamp": 1694123275885,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "T2zHZflUQlOr",
    "outputId": "0a3e8197-9764-41e7-b80e-5c7e1061ba07"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<style>#sk-container-id-11 {color: black;background-color: white;}#sk-container-id-11 pre{padding: 0;}#sk-container-id-11 div.sk-toggleable {background-color: white;}#sk-container-id-11 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-11 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-11 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-11 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-11 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-11 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-11 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-11 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-11 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-11 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-11 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-11 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-11 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-11 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-11 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-11 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-11 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-11 div.sk-item {position: relative;z-index: 1;}#sk-container-id-11 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-11 div.sk-item::before, #sk-container-id-11 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-11 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-11 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-11 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-11 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-11 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-11 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-11 div.sk-label-container {text-align: center;}#sk-container-id-11 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-11 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-11\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>ExtraTreesClassifier(bootstrap=True, class_weight=&#x27;balanced&#x27;,\n",
       "                     min_samples_leaf=100, n_estimators=500, n_jobs=-1)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-11\" type=\"checkbox\" checked><label for=\"sk-estimator-id-11\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">ExtraTreesClassifier</label><div class=\"sk-toggleable__content\"><pre>ExtraTreesClassifier(bootstrap=True, class_weight=&#x27;balanced&#x27;,\n",
       "                     min_samples_leaf=100, n_estimators=500, n_jobs=-1)</pre></div></div></div></div></div>"
      ],
      "text/plain": [
       "ExtraTreesClassifier(bootstrap=True, class_weight='balanced',\n",
       "                     min_samples_leaf=100, n_estimators=500, n_jobs=-1)"
      ]
     },
     "execution_count": 998,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "et.fit(latent_train,y)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 999,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5069,
     "status": "ok",
     "timestamp": 1694123280951,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6tMnYzZ_VPZR",
    "outputId": "932fc984-2dcd-45d7-e38b-89a2dcfe607e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(60000, 500)\n",
      "[[409  73  88 ... 196 183 386]\n",
      " [ 64 123 299 ... 148  74 241]\n",
      " [341  25  53 ... 343 253 421]\n",
      " ...\n",
      " [ 61  20 398 ... 219 268 330]\n",
      " [ 53 399 397 ...  36 267 319]\n",
      " [457  70 346 ... 232 140  51]]\n",
      "0.9944923126252497\n",
      "1.928843430307384e-06\n"
     ]
    }
   ],
   "source": [
    "leaves_train = et.apply(latent_train)\n",
    "print(leaves_train.shape)\n",
    "print(leaves_train)\n",
    "\n",
    "distances_train = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_train[i,j] = hamming(leaves_train[i,:], leaves_train[j,:])\n",
    "\n",
    "score_train = sum(distances_train)/499\n",
    "\n",
    "print(np.mean(score_train))\n",
    "print(np.cov(score_train))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1000,
   "metadata": {
    "executionInfo": {
     "elapsed": 19,
     "status": "ok",
     "timestamp": 1694123280951,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Q55SNuDNhQQ1"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# torch.save(model.state_dict(), path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1001,
   "metadata": {
    "executionInfo": {
     "elapsed": 18,
     "status": "ok",
     "timestamp": 1694123280951,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "0hpY3jsdhQUb"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "U6SnpaEVWOQf"
   },
   "source": [
    "# Testing on ID Data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1002,
   "metadata": {
    "executionInfo": {
     "elapsed": 19,
     "status": "ok",
     "timestamp": 1694123280952,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "R6olj5rRmTpo"
   },
   "outputs": [],
   "source": [
    "#num_epoch = 30"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1003,
   "metadata": {
    "executionInfo": {
     "elapsed": 18,
     "status": "ok",
     "timestamp": 1694123280952,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BLgLZ7STVPbU"
   },
   "outputs": [],
   "source": [
    "# test_dataset_MNIST = torchvision.datasets.MNIST(root=\".MNIST/test\", train=False, transform=transform, download=True)\n",
    "# test_loader_MNIST = torch.utils.data.DataLoader(test_dataset_MNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_MNIST, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1004,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5803,
     "status": "ok",
     "timestamp": 1694123286737,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "zM65LrAhVPda",
    "outputId": "7c251394-f897-4c38-8d89-7e1a711f3b69"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 1, 28, 28)\n",
      "(10000, 4, 7, 7)\n",
      "(10000, 784)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "test_dataset_MNIST = torchvision.datasets.MNIST(root=\".MNIST/test\", train=False, transform=transform, download=True)\n",
    "test_loader_MNIST = torch.utils.data.DataLoader(test_dataset_MNIST, batch_size = 10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_MNIST:\n",
    "    img, _ = batch\n",
    "    #img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "    #img = img.reshape(-1, 28*28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test = latent_test.detach().numpy()\n",
    "X_test = img.detach().numpy()\n",
    "print(X_test.shape)\n",
    "print(latent_test.shape)\n",
    "X_test = X_test.reshape(-1,1*28*28)\n",
    "latent_test = latent_test.reshape(-1,4*7*7)\n",
    "print(X_test.shape)\n",
    "print(latent_test.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1005,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4300,
     "status": "ok",
     "timestamp": 1694123291023,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "5l77BQBXVPfP",
    "outputId": "d54fe515-f2f4-4464-fb73-33ea61c964fa"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[ 30  31  34 ...  50 110   7]\n",
      " [246   8  34 ...   7   4 111]\n",
      " [246   8  59 ...  52  16 111]\n",
      " ...\n",
      " [ 30  60 279 ...  70  87  15]\n",
      " [246   8  59 ...   7 216 168]\n",
      " [246  61 265 ...  88 158 241]]\n",
      "0.9471780040080169\n",
      "0.00018871546034637847\n"
     ]
    }
   ],
   "source": [
    "latent_test_in = latent_test\n",
    "\n",
    "leaves_test_in = et.apply(latent_test_in)\n",
    "print(leaves_test_in.shape)\n",
    "print(leaves_test_in)\n",
    "\n",
    "distances_test_in = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_in[i,j] = hamming(leaves_test_in[i,:], leaves_test_in[j,:])\n",
    "\n",
    "score_test_in = sum(distances_test_in)/499\n",
    "print(np.mean(score_test_in))\n",
    "print(np.cov(score_test_in))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "zKHeKNSXWZQr"
   },
   "source": [
    "# Testing on OOD Data"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "DQgAh1gaXxP6"
   },
   "source": [
    "## FashionMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1006,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123291024,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "DTO-dHR3hkcS"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1007,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 632,
     "status": "ok",
     "timestamp": 1694123291635,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "U6-VmvGdWLPA",
    "outputId": "270720cf-0c28-4a0f-f10e-4c96678525d5"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "df_test_out = pd.read_csv('/content/gdrive/MyDrive/TOOD/datasets/fashion-mnist_test.csv')\n",
    "data_test_out = np.array(df_test_out)\n",
    "\n",
    "X_test_out = data_test_out[:, 1:785]/255\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Fashion = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Fashion, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1008,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 3788,
     "status": "ok",
     "timestamp": 1694123295420,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "G-T51piGWLRU",
    "outputId": "07c65eb8-697f-4096-d989-11008fe813ef"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 4, 7, 7)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Fashion = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Fashion:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Fashion = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Fashion.shape)\n",
    "latent_test_out_Fashion = latent_test_out_Fashion.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Fashion.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1009,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4321,
     "status": "ok",
     "timestamp": 1694123299720,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "RMYCE2rXYeqT",
    "outputId": "9465bb29-48e6-4d56-c41a-a9b11f72712c"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[100  15 264 ... 171 190 241]\n",
      " [100   8 128 ... 196 171   4]\n",
      " [100   8 264 ... 112  87 241]\n",
      " ...\n",
      " [110 196 140 ... 293  87 299]\n",
      " [100   8 178 ... 105  87 111]\n",
      " [ 38   8 159 ... 242 118 111]]\n",
      "0.89349619238477\n",
      "0.0018301517199724277\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Fashion = et.apply(latent_test_out_Fashion)\n",
    "\n",
    "print(leaves_test_out_Fashion.shape)\n",
    "print(leaves_test_out_Fashion)\n",
    "\n",
    "distances_test_out_Fashion = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Fashion[i,j] = hamming(leaves_test_out_Fashion[i,:], leaves_test_out_Fashion[j,:])\n",
    "\n",
    "score_test_out_Fashion = sum(distances_test_out_Fashion)/499\n",
    "\n",
    "print(np.mean(score_test_out_Fashion))\n",
    "print(np.cov(score_test_out_Fashion))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "3sbvCh5uLVF8"
   },
   "source": [
    "## BreastMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1010,
   "metadata": {
    "executionInfo": {
     "elapsed": 28,
     "status": "ok",
     "timestamp": 1694123299721,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "xH7FHZucLXof"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1011,
   "metadata": {
    "executionInfo": {
     "elapsed": 28,
     "status": "ok",
     "timestamp": 1694123299722,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "NPSj7LA5LcX1"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/breastmnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['train_images'].shape\n",
    "X_test_out = df['train_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_ChestMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1012,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 28,
     "status": "ok",
     "timestamp": 1694123299722,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "TlTGVy9BLcZ4",
    "outputId": "503cdd88-775e-46c2-cac7-bffa5bcab243"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "546\n",
      "(546, 4, 7, 7)\n",
      "(546, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['train_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_BreastMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_BreastMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Breast = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Breast.shape)\n",
    "latent_test_out_Breast = latent_test_out_Breast.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Breast.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1013,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4303,
     "status": "ok",
     "timestamp": 1694123304001,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "AwnfD_3CLcb7",
    "outputId": "17e48c28-e7ba-4b4a-c613-e42399447222"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(546, 500)\n",
      "[[100 117 211 ... 280 180 289]\n",
      " [212 239  53 ... 283 179 404]\n",
      " [326 239 211 ... 256 367 404]\n",
      " ...\n",
      " [461 239  53 ... 256 362 404]\n",
      " [284 144 211 ... 283 179 394]\n",
      " [110 200 205 ... 283 227 289]]\n",
      "0.7313129939879759\n",
      "0.0029484822333376596\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Breast = et.apply(latent_test_out_Breast)\n",
    "\n",
    "print(leaves_test_out_Breast.shape)\n",
    "print(leaves_test_out_Breast)\n",
    "\n",
    "distances_test_out_Breast = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Breast[i,j] = hamming(leaves_test_out_Breast[i,:], leaves_test_out_Breast[j,:])\n",
    "\n",
    "score_test_out_Breast = sum(distances_test_out_Breast)/499\n",
    "\n",
    "print(np.mean(score_test_out_Breast))\n",
    "print(np.cov(score_test_out_Breast))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1013,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123304002,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "bsj9NUx3LXq0"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "1vkCzIAMy5Yi"
   },
   "source": [
    "## ChestMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1014,
   "metadata": {
    "executionInfo": {
     "elapsed": 12,
     "status": "ok",
     "timestamp": 1694123304002,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "-I7QZNVUhnpI"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1015,
   "metadata": {
    "executionInfo": {
     "elapsed": 461,
     "status": "ok",
     "timestamp": 1694123304451,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "3Nh3znXBv1za"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/chestmnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_ChestMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1016,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 8030,
     "status": "ok",
     "timestamp": 1694123312479,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "FFfdi--zv12B",
    "outputId": "8dbb653b-dc95-43a3-a9f4-02556de0b313"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "22433\n",
      "(22433, 4, 7, 7)\n",
      "(22433, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_ChestMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Chest = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Chest.shape)\n",
    "latent_test_out_Chest = latent_test_out_Chest.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Chest.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1017,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4480,
     "status": "ok",
     "timestamp": 1694123316941,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "hLfKbVMzzxUi",
    "outputId": "fb2d0b2d-63bc-4c0b-9dab-c19bf74f3e11"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(22433, 500)\n",
      "[[176 452 205 ... 293 227 289]\n",
      " [176  54 205 ... 293 208 289]\n",
      " [177  54 159 ... 293 209 286]\n",
      " ...\n",
      " [177 436 178 ... 243 227 374]\n",
      " [176 437 178 ... 293 227 352]\n",
      " [176 452 205 ... 293 227 286]]\n",
      "0.6373530581162324\n",
      "0.0022009263155248694\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Chest = et.apply(latent_test_out_Chest)\n",
    "\n",
    "print(leaves_test_out_Chest.shape)\n",
    "print(leaves_test_out_Chest)\n",
    "\n",
    "distances_test_out_Chest = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Chest[i,j] = hamming(leaves_test_out_Chest[i,:], leaves_test_out_Chest[j,:])\n",
    "\n",
    "score_test_out_Chest = sum(distances_test_out_Chest)/499\n",
    "\n",
    "print(np.mean(score_test_out_Chest))\n",
    "print(np.cov(score_test_out_Chest))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "Z7xvIZvWMO-t"
   },
   "source": [
    "## OctMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1018,
   "metadata": {
    "executionInfo": {
     "elapsed": 26,
     "status": "ok",
     "timestamp": 1694123316942,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ZXOIXhMFMUEO"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1019,
   "metadata": {
    "executionInfo": {
     "elapsed": 25,
     "status": "ok",
     "timestamp": 1694123316942,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "9WyQFN4SMUGT"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/octmnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_ChestMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1020,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 328,
     "status": "ok",
     "timestamp": 1694123317246,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "twgmrsCUMUIH",
    "outputId": "5c4c09cf-2be0-4d88-cc67-75666761341e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1000\n",
      "(1000, 4, 7, 7)\n",
      "(1000, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_OctMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_OctMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Oct = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Oct.shape)\n",
    "latent_test_out_Oct = latent_test_out_Oct.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Oct.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1021,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4763,
     "status": "ok",
     "timestamp": 1694123322008,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "JNTwND7cMUKG",
    "outputId": "5eafe1e2-20cc-4611-fe9e-3108aeb97da4"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(1000, 500)\n",
      "[[463 239  53 ... 256 396 404]\n",
      " [326 447  53 ... 289 437 405]\n",
      " [457 239  53 ... 257 362 404]\n",
      " ...\n",
      " [378 452 211 ... 339 227 404]\n",
      " [461 239  53 ... 257 362 404]\n",
      " [457 452  53 ... 257 386 404]]\n",
      "0.6319768336673346\n",
      "0.0058429905862399335\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Oct = et.apply(latent_test_out_Oct)\n",
    "\n",
    "print(leaves_test_out_Oct.shape)\n",
    "print(leaves_test_out_Oct)\n",
    "\n",
    "distances_test_out_Oct = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Oct[i,j] = hamming(leaves_test_out_Oct[i,:], leaves_test_out_Oct[j,:])\n",
    "\n",
    "score_test_out_Oct = sum(distances_test_out_Oct)/499\n",
    "\n",
    "print(np.mean(score_test_out_Oct))\n",
    "print(np.cov(score_test_out_Oct))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "_Tguoeb3Nosv"
   },
   "source": [
    "## PneumMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1022,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123322009,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "yhageUDChpGt"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1023,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123322009,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "SJN2w-zVzxWm"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/pneumoniamnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['train_images'].shape\n",
    "X_test_out = df['train_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Pneum = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Pneum, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1024,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1409,
     "status": "ok",
     "timestamp": 1694123323405,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "zmGFQYZvNtiL",
    "outputId": "7c8b0db4-1868-44ae-9290-cc3af5fe6cac"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "4708\n",
      "(4708, 4, 7, 7)\n",
      "(4708, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['train_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Pneum = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Pneum:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Pneum = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Pneum.shape)\n",
    "latent_test_out_Pneum = latent_test_out_Pneum.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Pneum.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1025,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4194,
     "status": "ok",
     "timestamp": 1694123327594,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "9SuNE4aSNt7b",
    "outputId": "19e92bb5-a3ae-4195-b38e-16e7807c5dac"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(4708, 500)\n",
      "[[100  15 159 ... 293  87 289]\n",
      " [177  54 159 ... 293 171 286]\n",
      " [100  15 159 ... 293 180 289]\n",
      " ...\n",
      " [100  15 159 ... 293 180 289]\n",
      " [100   8 159 ... 293  87 289]\n",
      " [100  15 159 ... 112  87   4]]\n",
      "0.5854379318637275\n",
      "0.003699191219194934\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Pneum = et.apply(latent_test_out_Pneum)\n",
    "\n",
    "print(leaves_test_out_Pneum.shape)\n",
    "print(leaves_test_out_Pneum)\n",
    "\n",
    "distances_test_out_Pneum = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Pneum[i,j] = hamming(leaves_test_out_Pneum[i,:], leaves_test_out_Pneum[j,:])\n",
    "\n",
    "score_test_out_Pneum = sum(distances_test_out_Pneum)/499\n",
    "\n",
    "print(np.mean(score_test_out_Pneum))\n",
    "print(np.cov(score_test_out_Pneum))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "C7Lo5fFxNkeC"
   },
   "source": [
    "## OrganaMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1026,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123327594,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "y1JVWYobNnXs"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1027,
   "metadata": {
    "executionInfo": {
     "elapsed": 456,
     "status": "ok",
     "timestamp": 1694123328029,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "cHlm9xYvNnbS"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/organamnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Organc, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1028,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 6441,
     "status": "ok",
     "timestamp": 1694123334467,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "-0ODe_SyNneE",
    "outputId": "09f718c6-c054-4668-8843-875209667792"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "17778\n",
      "(17778, 4, 7, 7)\n",
      "(17778, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Organa = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Organa:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Organa = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Organa.shape)\n",
    "latent_test_out_Organa = latent_test_out_Organa.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Organa.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1029,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4285,
     "status": "ok",
     "timestamp": 1694123338730,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "MOFGPtBYNngB",
    "outputId": "9c35ac22-aeb3-4202-ccb6-61a73c2c7e10"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(17778, 500)\n",
      "[[109 198  53 ... 367  24 288]\n",
      " [149  54  58 ... 418  20 288]\n",
      " [246 198 181 ... 293 190 289]\n",
      " ...\n",
      " [100 117 159 ... 369  60   4]\n",
      " [246 151 211 ... 289  87 387]\n",
      " [100 144 205 ... 293 172 387]]\n",
      "0.83064046492986\n",
      "0.0041737427182972795\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Organa = et.apply(latent_test_out_Organa)\n",
    "\n",
    "print(leaves_test_out_Organa.shape)\n",
    "print(leaves_test_out_Organa)\n",
    "\n",
    "distances_test_out_Organa = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Organa[i,j] = hamming(leaves_test_out_Organa[i,:], leaves_test_out_Organa[j,:])\n",
    "\n",
    "score_test_out_Organa = sum(distances_test_out_Organa)/499\n",
    "\n",
    "print(np.mean(score_test_out_Organa))\n",
    "print(np.cov(score_test_out_Organa))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "UEKwndGfCmv6"
   },
   "source": [
    "## OrgancMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1030,
   "metadata": {
    "executionInfo": {
     "elapsed": 16,
     "status": "ok",
     "timestamp": 1694123338731,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "J1GLB1jDh3uE"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1031,
   "metadata": {
    "executionInfo": {
     "elapsed": 16,
     "status": "ok",
     "timestamp": 1694123338731,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6OlXP64YNuYF"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/organcmnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Organc, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1032,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2910,
     "status": "ok",
     "timestamp": 1694123341626,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "GneANgXlNuoo",
    "outputId": "46367c90-8e14-419d-ce61-d7f26f09b127"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "8268\n",
      "(8268, 4, 7, 7)\n",
      "(8268, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Organc:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Organc = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Organc.shape)\n",
    "latent_test_out_Organc = latent_test_out_Organc.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Organc.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1033,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4162,
     "status": "ok",
     "timestamp": 1694123345772,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "poQYWGAOC5gL",
    "outputId": "bd416b93-f3fd-444c-fe9e-193e72f41344"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(8268, 500)\n",
      "[[100 117 159 ... 105  87   4]\n",
      " [ 30  31 159 ... 283 118 286]\n",
      " [216 452 211 ... 283 324   4]\n",
      " ...\n",
      " [328 151 212 ... 281 200 404]\n",
      " [212 239 211 ... 256 227 288]\n",
      " [110 239 211 ... 283 227 289]]\n",
      "0.8206654909819643\n",
      "0.004101189186206943\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Organc = et.apply(latent_test_out_Organc)\n",
    "\n",
    "print(leaves_test_out_Organc.shape)\n",
    "print(leaves_test_out_Organc)\n",
    "\n",
    "distances_test_out_Organc = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Organc[i,j] = hamming(leaves_test_out_Organc[i,:], leaves_test_out_Organc[j,:])\n",
    "\n",
    "score_test_out_Organc = sum(distances_test_out_Organc)/499\n",
    "\n",
    "print(np.mean(score_test_out_Organc))\n",
    "print(np.cov(score_test_out_Organc))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "I4J8ADHIOI1l"
   },
   "source": [
    "## OrgansMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1034,
   "metadata": {
    "executionInfo": {
     "elapsed": 8,
     "status": "ok",
     "timestamp": 1694123345773,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Z9oI4sJpOL2y"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1035,
   "metadata": {
    "executionInfo": {
     "elapsed": 6,
     "status": "ok",
     "timestamp": 1694123345773,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Y9Wd57elOMA6"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/organsmnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Organc, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1036,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 3075,
     "status": "ok",
     "timestamp": 1694123348843,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "r2zIds3qOMDY",
    "outputId": "adf268f3-bcce-401e-d19e-97afa515b4b8"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "8829\n",
      "(8829, 4, 7, 7)\n",
      "(8829, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Organs = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Organs:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Organs = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Organs.shape)\n",
    "latent_test_out_Organs = latent_test_out_Organs.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Organs.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1037,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4422,
     "status": "ok",
     "timestamp": 1694123353243,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "S--_kE0yOMOV",
    "outputId": "5ca9a1cb-fe6b-40e6-a429-7236cd57318e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(8829, 500)\n",
      "[[ 37  15 159 ... 112  87 289]\n",
      " [ 10  31 159 ... 105  87   4]\n",
      " [ 36 452 205 ... 293  87   4]\n",
      " ...\n",
      " [ 37 117 159 ... 105 118 289]\n",
      " [100 239 211 ... 283 227 289]\n",
      " [100 198 211 ... 293 180 289]]\n",
      "0.8312460280561125\n",
      "0.0040789310167525005\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Organs = et.apply(latent_test_out_Organs)\n",
    "\n",
    "print(leaves_test_out_Organs.shape)\n",
    "print(leaves_test_out_Organs)\n",
    "\n",
    "distances_test_out_Organs = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Organs[i,j] = hamming(leaves_test_out_Organs[i,:], leaves_test_out_Organs[j,:])\n",
    "\n",
    "score_test_out_Organs = sum(distances_test_out_Organs)/499\n",
    "\n",
    "print(np.mean(score_test_out_Organs))\n",
    "print(np.cov(score_test_out_Organs))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "PK_cY3XVDxlQ"
   },
   "source": [
    "## TissueMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1038,
   "metadata": {
    "executionInfo": {
     "elapsed": 17,
     "status": "ok",
     "timestamp": 1694123353244,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "rXhtk9Mah8mR"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1039,
   "metadata": {
    "executionInfo": {
     "elapsed": 926,
     "status": "ok",
     "timestamp": 1694123354154,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ViCtSF5iC5ie"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/tissuemnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Tissue = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Tissue, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1040,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 15499,
     "status": "ok",
     "timestamp": 1694123369652,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "iSIHWqqOC5kT",
    "outputId": "4def9c2b-3e7a-4727-c96b-e9d4c3712bb3"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "47280\n",
      "(47280, 4, 7, 7)\n",
      "(47280, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Tissue = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Tissue:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Tissue = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Tissue.shape)\n",
    "latent_test_out_Tissue = latent_test_out_Tissue.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Tissue.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1041,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5193,
     "status": "ok",
     "timestamp": 1694123374820,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "IUQ3nT57Egcv",
    "outputId": "a8423d8d-7033-4009-d710-ec4318e79e92"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(47280, 500)\n",
      "[[379 447  59 ... 257 367 390]\n",
      " [198 452 211 ... 334 227 288]\n",
      " [379 452  53 ... 257 362 404]\n",
      " ...\n",
      " [463 200 211 ... 257 227 390]\n",
      " [461 452  53 ... 339 362 404]\n",
      " [461 239  53 ... 257 362 404]]\n",
      "0.6040701563126253\n",
      "0.00738135287517109\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Tissue = et.apply(latent_test_out_Tissue)\n",
    "\n",
    "print(leaves_test_out_Tissue.shape)\n",
    "print(leaves_test_out_Tissue)\n",
    "\n",
    "distances_test_out_Tissue = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Tissue[i,j] = hamming(leaves_test_out_Tissue[i,:], leaves_test_out_Tissue[j,:])\n",
    "\n",
    "score_test_out_Tissue = sum(distances_test_out_Tissue)/499\n",
    "\n",
    "print(np.mean(score_test_out_Tissue))\n",
    "print(np.cov(score_test_out_Tissue))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "V9pDbbT2Q9xv"
   },
   "source": [
    "## KMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1042,
   "metadata": {
    "executionInfo": {
     "elapsed": 28,
     "status": "ok",
     "timestamp": 1694123374821,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "e7-UM77Fh-w-"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1043,
   "metadata": {
    "executionInfo": {
     "elapsed": 30,
     "status": "ok",
     "timestamp": 1694123374826,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "4BiRKanXxvFv"
   },
   "outputs": [],
   "source": [
    "# test_dataset_KMNIST = torchvision.datasets.KMNIST(root=\"./data\", train=False, transform=transform, download=True)\n",
    "# test_loader_KMNIST = torch.utils.data.DataLoader(test_dataset_KMNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_KMNIST, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1044,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5291,
     "status": "ok",
     "timestamp": 1694123380088,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "IrDPmFlTxvH4",
    "outputId": "1d53b78a-fbc1-433d-fb1e-d1bf22032829"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_KMNIST = torchvision.datasets.KMNIST(root='./data', train=False, download=True, transform=transform)\n",
    "test_loader_KMNIST = torch.utils.data.DataLoader(test_dataset_KMNIST, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_KMNIST:\n",
    "    img, _ = batch\n",
    "    #img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_KMNIST = latent_test_out.detach().numpy()\n",
    "latent_test_out_KMNIST = latent_test_out_KMNIST.reshape(-1,4*7*7)\n",
    "print(latent_test_out_KMNIST.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1045,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4498,
     "status": "ok",
     "timestamp": 1694123384562,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "WqFrdnepRkI7",
    "outputId": "d8da6eb3-a421-4537-aea0-82957fc8e0bb"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[110  31 125 ... 105 219 240]\n",
      " [215  40 140 ...  10  80   4]\n",
      " [ 31   8 178 ... 326 172   7]\n",
      " ...\n",
      " [121  15 159 ... 243  49 113]\n",
      " [109   8 276 ...  65  99 168]\n",
      " [110   8 163 ...  67  24 382]]\n",
      "0.9500735551102213\n",
      "8.145258493977817e-05\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_KMNIST = et.apply(latent_test_out_KMNIST)\n",
    "\n",
    "print(leaves_test_out_KMNIST.shape)\n",
    "print(leaves_test_out_KMNIST)\n",
    "\n",
    "distances_test_out_KMNIST = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_KMNIST[i,j] = hamming(leaves_test_out_KMNIST[i,:], leaves_test_out_KMNIST[j,:])\n",
    "\n",
    "score_test_out_KMNIST = sum(distances_test_out_KMNIST)/499\n",
    "\n",
    "print(np.mean(score_test_out_KMNIST))\n",
    "print(np.cov(score_test_out_KMNIST))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "brj6eAE_SJn2"
   },
   "source": [
    "## QMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1046,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123384562,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "dIaTRR3kif-b"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1047,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123384563,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "1iG0aHi7xvJH"
   },
   "outputs": [],
   "source": [
    "# test_dataset_QMNIST = torchvision.datasets.QMNIST(root=\"./data\", train=False, transform=transform, download=True)\n",
    "# test_loader_QMNIST = torch.utils.data.DataLoader(test_dataset_QMNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_QMNIST, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1048,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 36049,
     "status": "ok",
     "timestamp": 1694123420590,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "gXmIqYEnSMZs",
    "outputId": "1e103123-9f7f-46d8-8509-0d9c16d0c30e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_QMNIST = torchvision.datasets.QMNIST(root='./data', train=False, download=True, transform=transform)\n",
    "test_loader_QMNIST = torch.utils.data.DataLoader(test_dataset_QMNIST, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_QMNIST:\n",
    "    img, _ = batch\n",
    "    #img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_QMNIST = latent_test_out.detach().numpy()\n",
    "latent_test_out_QMNIST = latent_test_out_QMNIST.reshape(-1,4*7*7)\n",
    "print(latent_test_out_QMNIST.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1049,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4635,
     "status": "ok",
     "timestamp": 1694123425199,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "OW51VvQQSMbw",
    "outputId": "7a07db89-e0b5-48c2-a709-99025e9aee00"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[ 22 123 283 ... 120  82   4]\n",
      " [105   8 219 ...  81   7   4]\n",
      " [246   8  28 ...  74  87 111]\n",
      " ...\n",
      " [ 37  31 183 ...  65  87 111]\n",
      " [ 14   8 159 ...  65 140   4]\n",
      " [160  50 256 ...   7  84  15]]\n",
      "0.9467801683366742\n",
      "0.00023753421725554279\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_QMNIST = et.apply(latent_test_out_QMNIST)\n",
    "\n",
    "print(leaves_test_out_QMNIST.shape)\n",
    "print(leaves_test_out_QMNIST)\n",
    "\n",
    "distances_test_out_QMNIST = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_QMNIST[i,j] = hamming(leaves_test_out_QMNIST[i,:], leaves_test_out_QMNIST[j,:])\n",
    "\n",
    "score_test_out_QMNIST = sum(distances_test_out_QMNIST)/499\n",
    "\n",
    "print(np.mean(score_test_out_QMNIST))\n",
    "print(np.cov(score_test_out_QMNIST))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "iKdP-64sRyQ8"
   },
   "source": [
    "## Omniglot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1050,
   "metadata": {
    "executionInfo": {
     "elapsed": 29,
     "status": "ok",
     "timestamp": 1694123425200,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "GNAQF4F4R9JQ"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1051,
   "metadata": {
    "executionInfo": {
     "elapsed": 28,
     "status": "ok",
     "timestamp": 1694123425200,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "bQdeByYMSFYz"
   },
   "outputs": [],
   "source": [
    "# test_dataset_Omniglot = torchvision.datasets.Omniglot(root='./data', download=True, transform=transform)\n",
    "# test_loader_Omniglot = torch.utils.data.DataLoader(test_dataset_QMNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Omniglot, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1052,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 15547,
     "status": "ok",
     "timestamp": 1694123440721,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "rOznxhcjSMd0",
    "outputId": "ea455467-5d9c-431e-cacc-f68c75788f7b"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Files already downloaded and verified\n",
      "(19280, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_Omniglot = torchvision.datasets.Omniglot(root='./data', download=True, transform=transform)\n",
    "\n",
    "# Creating Dataloaders from the\n",
    "# training and testing dataset\n",
    "test_loader_Omniglot = torch.utils.data.DataLoader(test_dataset_Omniglot, batch_size=32460, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Omniglot:\n",
    "    img, _ = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Omniglot = latent_test_out.detach().numpy()\n",
    "latent_test_out_Omniglot = latent_test_out_Omniglot.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Omniglot.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1053,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4198,
     "status": "ok",
     "timestamp": 1694123444894,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "2l0MVvcaSMfp",
    "outputId": "4a292208-04c4-48bb-ac86-d61192dbafd4"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(19280, 500)\n",
      "[[ 37   8 159 ... 243  87   4]\n",
      " [165  25 159 ... 293  87 111]\n",
      " [100  31 159 ... 105  87   4]\n",
      " ...\n",
      " [ 10  31 159 ... 105  87   4]\n",
      " [ 10  31 159 ... 243  87   4]\n",
      " [ 10 117 159 ... 105  87   4]]\n",
      "0.45097717034068113\n",
      "0.0026636415938544817\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Omniglot = et.apply(latent_test_out_Omniglot)\n",
    "\n",
    "print(leaves_test_out_Omniglot.shape)\n",
    "print(leaves_test_out_Omniglot)\n",
    "\n",
    "distances_test_out_Omniglot = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Omniglot[i,j] = hamming(leaves_test_out_Omniglot[i,:], leaves_test_out_Omniglot[j,:])\n",
    "\n",
    "score_test_out_Omniglot = sum(distances_test_out_Omniglot)/499\n",
    "\n",
    "print(np.mean(score_test_out_Omniglot))\n",
    "print(np.cov(score_test_out_Omniglot))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "u9OZcvTSXkPh"
   },
   "source": [
    "## Cifar10bw"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1054,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123444895,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QfMu7Z3kXol1"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1055,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123444895,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Ej9JmeDhX0NG"
   },
   "outputs": [],
   "source": [
    "# test_dataset_Cifar10bw = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)\n",
    "# test_loader_Cifar10bw = torch.utils.data.DataLoader(test_dataset_Cifar10bw, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Cifar10bw, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1056,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 7346,
     "status": "ok",
     "timestamp": 1694123452220,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "96LUcE1kXon3",
    "outputId": "b7e9d1ce-f421-41b0-e1f1-ae5dd7852504"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Files already downloaded and verified\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_Cifar10bw = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)\n",
    "\n",
    "# Creating Dataloaders from the\n",
    "# training and testing dataset\n",
    "test_loader_Cifar10bw = torch.utils.data.DataLoader(test_dataset_Cifar10bw, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Cifar10bw:\n",
    "    img, _ = batch\n",
    "    img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Cifar10bw = latent_test_out.detach().numpy()\n",
    "latent_test_out_Cifar10bw = latent_test_out_Cifar10bw.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Cifar10bw.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1057,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4643,
     "status": "ok",
     "timestamp": 1694123456839,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "-9ekzdVoYJIH",
    "outputId": "b600a252-afbb-428c-8179-189c3bb404f1"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[100 452 205 ... 293  87   4]\n",
      " [ 37 452 211 ... 278  87   4]\n",
      " [222 452 211 ... 334 141 111]\n",
      " ...\n",
      " [ 36 117 159 ... 280 428   4]\n",
      " [326 239 159 ... 256 227 394]\n",
      " [313 112 205 ... 293 208 111]]\n",
      "0.7999598076152303\n",
      "0.0016177342717968522\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Cifar10bw = et.apply(latent_test_out_Cifar10bw)\n",
    "\n",
    "print(leaves_test_out_Cifar10bw.shape)\n",
    "print(leaves_test_out_Cifar10bw)\n",
    "\n",
    "distances_test_out_Cifar10bw = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Cifar10bw[i,j] = hamming(leaves_test_out_Cifar10bw[i,:], leaves_test_out_Cifar10bw[j,:])\n",
    "\n",
    "score_test_out_Cifar10bw = sum(distances_test_out_Cifar10bw)/499\n",
    "\n",
    "print(np.mean(score_test_out_Cifar10bw))\n",
    "print(np.cov(score_test_out_Cifar10bw))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "WDCNJ2thdelj"
   },
   "source": [
    "## NotMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1058,
   "metadata": {
    "executionInfo": {
     "elapsed": 26,
     "status": "ok",
     "timestamp": 1694123456840,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "hhMEPlqad6cl"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1059,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1746,
     "status": "ok",
     "timestamp": 1694123458562,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "7HUmXsizdh0T",
    "outputId": "87fa8495-266f-47b5-bbd7-a692955853bd"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(500, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "from pims import ImageSequence\n",
    "from PIL import Image\n",
    "\n",
    "images_A = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/A/*.png')\n",
    "images_B = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/B/*.png')\n",
    "images_C = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/C/*.png')\n",
    "images_D = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/D/*.png')\n",
    "images_E = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/E/*.png')\n",
    "images_F = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/F/*.png')\n",
    "images_G = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/G/*.png')\n",
    "images_H = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/H/*.png')\n",
    "images_I = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/I/*.png')\n",
    "images_J = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/J/*.png')\n",
    "\n",
    "X_data_A = np.zeros((50, 28**2))\n",
    "X_data_B = np.zeros((50, 28**2))\n",
    "X_data_C = np.zeros((50, 28**2))\n",
    "X_data_D = np.zeros((50, 28**2))\n",
    "X_data_E = np.zeros((50, 28**2))\n",
    "X_data_F = np.zeros((50, 28**2))\n",
    "X_data_G = np.zeros((50, 28**2))\n",
    "X_data_H = np.zeros((50, 28**2))\n",
    "X_data_I = np.zeros((50, 28**2))\n",
    "X_data_J = np.zeros((50, 28**2))\n",
    "\n",
    "for i in range(50):\n",
    "    X_data_A[i,:] = np.reshape(np.array(images_A[i]), (1,28**2))/255\n",
    "    X_data_B[i,:] = np.reshape(np.array(images_B[i]), (1,28**2))/255\n",
    "    X_data_C[i,:] = np.reshape(np.array(images_C[i]), (1,28**2))/255\n",
    "    X_data_D[i,:] = np.reshape(np.array(images_D[i]), (1,28**2))/255\n",
    "    X_data_E[i,:] = np.reshape(np.array(images_E[i]), (1,28**2))/255\n",
    "    X_data_F[i,:] = np.reshape(np.array(images_F[i]), (1,28**2))/255\n",
    "    X_data_G[i,:] = np.reshape(np.array(images_G[i]), (1,28**2))/255\n",
    "    X_data_H[i,:] = np.reshape(np.array(images_H[i]), (1,28**2))/255\n",
    "    X_data_I[i,:] = np.reshape(np.array(images_I[i]), (1,28**2))/255\n",
    "    X_data_J[i,:] = np.reshape(np.array(images_J[i]), (1,28**2))/255\n",
    "\n",
    "\n",
    "X_test_out = np.vstack([X_data_A, X_data_B, X_data_C, X_data_D, X_data_E, X_data_F, X_data_G, X_data_H, X_data_I, X_data_J])\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1060,
   "metadata": {
    "executionInfo": {
     "elapsed": 5,
     "status": "ok",
     "timestamp": 1694123458563,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QtoumAYBdh4P"
   },
   "outputs": [],
   "source": [
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_NotMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_NotMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1061,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 15884,
     "status": "ok",
     "timestamp": 1694123474443,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "vqZPvS-3dh7k",
    "outputId": "8254cd69-8191-42dd-f14e-3f7c80cb9067"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(7280, 196)\n"
     ]
    }
   ],
   "source": [
    "test_loader_NotMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_NotMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_NotMNIST = latent_test_out.detach().numpy()\n",
    "latent_test_out_NotMNIST = latent_test_out_NotMNIST.reshape(-1,4*7*7)\n",
    "print(latent_test_out_NotMNIST.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1062,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4439,
     "status": "ok",
     "timestamp": 1694123478857,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "34usMYYqdh8u",
    "outputId": "d861e8fc-7b34-4191-ba48-fbd931c56172"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(7280, 500)\n",
      "[[326 200  53 ... 257 324 390]\n",
      " [379 447  53 ... 256 359 404]\n",
      " [457 239  53 ... 289 324 404]\n",
      " ...\n",
      " [379 239 234 ... 257 227 288]\n",
      " [326 239 211 ... 257 227 404]\n",
      " [198 386  53 ... 289 324 289]]\n",
      "0.620590621242485\n",
      "0.006332796966359325\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_NotMNIST = et.apply(latent_test_out_NotMNIST)\n",
    "\n",
    "print(leaves_test_out_NotMNIST.shape)\n",
    "print(leaves_test_out_NotMNIST)\n",
    "\n",
    "distances_test_out_NotMNIST = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_NotMNIST[i,j] = hamming(leaves_test_out_NotMNIST[i,:], leaves_test_out_NotMNIST[j,:])\n",
    "\n",
    "score_test_out_NotMNIST = sum(distances_test_out_NotMNIST)/499\n",
    "\n",
    "print(np.mean(score_test_out_NotMNIST))\n",
    "print(np.cov(score_test_out_NotMNIST))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1062,
   "metadata": {
    "executionInfo": {
     "elapsed": 25,
     "status": "ok",
     "timestamp": 1694123478857,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "SniWCeDXdh99"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "tamsyBx9xv2t"
   },
   "source": [
    "## Gaussian"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1063,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123478857,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "efiYSL3HjJa5"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1064,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 739,
     "status": "ok",
     "timestamp": 1694123479573,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "qAcmKgItEge1",
    "outputId": "350e9138-7cdd-48f4-e121-485fa32b7431"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 784)\n",
      "(10000, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "# Gaussian random noise\n",
    "mean_test_out = np.random.uniform(low=0,high=1,size=784)\n",
    "cov_test_out = np.random.rand(784,784)\n",
    "cov_test_out = np.matmul(cov_test_out, cov_test_out.T)\n",
    "X_test_out = np.random.multivariate_normal(mean_test_out, cov_test_out, 10000)\n",
    "X_test_out = MinMaxScaler().fit_transform(X_test_out)\n",
    "print(X_test_out.shape)\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1065,
   "metadata": {
    "executionInfo": {
     "elapsed": 5,
     "status": "ok",
     "timestamp": 1694123479573,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "i1d4sx8MitCF"
   },
   "outputs": [],
   "source": [
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# train_loader_Gaussian = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, train_loader_Gaussian, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1066,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 838,
     "status": "ok",
     "timestamp": 1694123480408,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QxSu2wMBxyYr",
    "outputId": "3fd08e4f-3fae-4ab7-97da-487e698b42c8"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 4, 7, 7)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000)\n",
    "\n",
    "for batch in test_loader:\n",
    "    img = batch\n",
    "    img = img.reshape(-1,1,28,28)\n",
    "    # Generating output\n",
    "    #out = model.forward(img)\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Gaussian = latent_test_out.detach().numpy()\n",
    "print(latent_test_out_Gaussian.shape)\n",
    "latent_test_out_Gaussian = latent_test_out_Gaussian.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Gaussian.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1067,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4333,
     "status": "ok",
     "timestamp": 1694123484737,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "l24-4OTyxyaj",
    "outputId": "36698353-6363-477f-cd6d-073cec39b292"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[216 452 211 ... 286 227 404]\n",
      " [379 452 211 ... 283 324 404]\n",
      " [463 452 211 ... 286 368 404]\n",
      " ...\n",
      " [379 452 211 ... 286 368 404]\n",
      " [100  15 159 ... 293  87   4]\n",
      " [379 452 211 ... 286 368 404]]\n",
      "0.6145674709418838\n",
      "0.0070144680310849986\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Gaussian = et.apply(latent_test_out_Gaussian)\n",
    "\n",
    "print(leaves_test_out_Gaussian.shape)\n",
    "print(leaves_test_out_Gaussian)\n",
    "\n",
    "distances_test_out_Gaussian = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Gaussian[i,j] = hamming(leaves_test_out_Gaussian[i,:], leaves_test_out_Gaussian[j,:])\n",
    "\n",
    "score_test_out_Gaussian = sum(distances_test_out_Gaussian)/499\n",
    "\n",
    "print(np.mean(score_test_out_Gaussian))\n",
    "print(np.cov(score_test_out_Gaussian))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "4Zs0-6kFybMM"
   },
   "source": [
    "## Uniform"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1068,
   "metadata": {
    "executionInfo": {
     "elapsed": 31,
     "status": "ok",
     "timestamp": 1694123484737,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BHdD_LxEjNmI"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1069,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 30,
     "status": "ok",
     "timestamp": 1694123484738,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6b5z_lW8xycj",
    "outputId": "3e228ce5-f5ea-4da9-acf0-237494bbe14e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 784)\n",
      "(10000, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "# Uniform random noise\n",
    "x_min = [0]*784\n",
    "x_max = [1]*784\n",
    "X_test_out = np.random.uniform(low=x_min, high=x_max, size=(10000,784))\n",
    "X_test_out = MinMaxScaler().fit_transform(X_test_out)\n",
    "print(X_test_out.shape)\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1070,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123484738,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "X6MhxpC2jQU2"
   },
   "outputs": [],
   "source": [
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# train_loader_Uniform = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, train_loader_Uniform, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1071,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1071,
     "status": "ok",
     "timestamp": 1694123485787,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BG0fLErIxyeZ",
    "outputId": "e6eebde2-7e45-406d-9368-598b3aeda504"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 4, 7, 7)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000)\n",
    "\n",
    "for batch in test_loader:\n",
    "    img = batch\n",
    "    img = img.reshape(-1,1,28,28)\n",
    "    # Generating output\n",
    "    #out = model.forward(img)\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Uniform = latent_test_out.detach().numpy()\n",
    "print(latent_test_out_Uniform.shape)\n",
    "latent_test_out_Uniform = latent_test_out_Uniform.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Uniform.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1072,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4679,
     "status": "ok",
     "timestamp": 1694123490462,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "FvwHsDP5yif8",
    "outputId": "e664366d-7eef-4d26-daf2-3ec7433c3e85"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[100 249 159 ... 112 324 289]\n",
      " [313 452 205 ... 293 323 289]\n",
      " [100   8 159 ... 281 180 387]\n",
      " ...\n",
      " [100 117 159 ... 281 180 289]\n",
      " [100  15 211 ... 293 227 289]\n",
      " [100 144 159 ... 283 323 289]]\n",
      "0.6103612665330663\n",
      "0.0005644532991188025\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Uniform = et.apply(latent_test_out_Uniform)\n",
    "\n",
    "print(leaves_test_out_Uniform.shape)\n",
    "print(leaves_test_out_Uniform)\n",
    "\n",
    "distances_test_out_Uniform = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Uniform[i,j] = hamming(leaves_test_out_Uniform[i,:], leaves_test_out_Uniform[j,:])\n",
    "\n",
    "score_test_out_Uniform = sum(distances_test_out_Uniform)/499\n",
    "\n",
    "print(np.mean(score_test_out_Uniform))\n",
    "print(np.cov(score_test_out_Uniform))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1072,
   "metadata": {
    "executionInfo": {
     "elapsed": 24,
     "status": "ok",
     "timestamp": 1694123490462,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "N_CKgEZ1yiju"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 1072,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123490463,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "nxm_k1Noyil7"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "FZGej4gIyhMD"
   },
   "source": [
    "# Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1074,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123491044,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "xMKKU1PywASB",
    "outputId": "4048ad25-4c0b-43d2-f1f9-184406c58e1a"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.894492\n",
      "0.99984\n",
      "1.0\n",
      "0.9977239999999999\n",
      "0.947526\n",
      "0.944412\n",
      "0.921948\n",
      "1.0\n",
      "0.99956\n",
      "0.44524\n",
      "0.49766\n",
      "1.0\n",
      "0.999912\n",
      "1.0\n",
      "0.99984\n",
      "1.0\n"
     ]
    }
   ],
   "source": [
    "score_pred_Breast = np.concatenate([score_test_in, score_test_out_Breast])\n",
    "score_pred_Chest = np.concatenate([score_test_in, score_test_out_Chest])\n",
    "score_pred_Oct = np.concatenate([score_test_in, score_test_out_Oct])\n",
    "score_pred_Organa = np.concatenate([score_test_in, score_test_out_Organa])\n",
    "score_pred_Organc = np.concatenate([score_test_in, score_test_out_Organc])\n",
    "score_pred_Organs = np.concatenate([score_test_in, score_test_out_Organs])\n",
    "score_pred_Pneum = np.concatenate([score_test_in, score_test_out_Pneum])\n",
    "score_pred_Tissue = np.concatenate([score_test_in, score_test_out_Tissue])\n",
    "score_pred_KMNIST = np.concatenate([score_test_in, score_test_out_KMNIST])\n",
    "score_pred_QMNIST = np.concatenate([score_test_in, score_test_out_QMNIST])\n",
    "score_pred_Omniglot = np.concatenate([score_test_in, score_test_out_Omniglot])\n",
    "score_pred_Cifar10bw = np.concatenate([score_test_in, score_test_out_Cifar10bw])\n",
    "score_pred_NotMNIST = np.concatenate([score_test_in, score_test_out_NotMNIST])\n",
    "score_pred_Gaussian = np.concatenate([score_test_in, score_test_out_Gaussian])\n",
    "score_pred_Uniform = np.concatenate([score_test_in, score_test_out_Uniform])\n",
    "score_true = np.concatenate([np.ones(500), np.zeros(500)])\n",
    "\n",
    "print(roc_auc_score(score_true, score_pred_Breast))\n",
    "print(roc_auc_score(score_true, score_pred_Chest))\n",
    "print(roc_auc_score(score_true, score_pred_Oct))\n",
    "print(roc_auc_score(score_true, score_pred_Organa))\n",
    "print(roc_auc_score(score_true, score_pred_Organc))\n",
    "print(roc_auc_score(score_true, score_pred_Organs))\n",
    "print(roc_auc_score(score_true, score_pred_Pneum))\n",
    "print(roc_auc_score(score_true, score_pred_Tissue))\n",
    "print(roc_auc_score(score_true, score_pred_KMNIST))\n",
    "print(roc_auc_score(score_true, score_pred_QMNIST))\n",
    "print(roc_auc_score(score_true, score_pred_Omniglot))\n",
    "print(roc_auc_score(score_true, score_pred_Cifar10bw))\n",
    "print(roc_auc_score(score_true, score_pred_NotMNIST))\n",
    "print(roc_auc_score(score_true, score_pred_Gaussian))\n",
    "print(roc_auc_score(score_true, score_pred_Uniform))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1075,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 19,
     "status": "ok",
     "timestamp": 1694123491044,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "77iJeZtfwYyj",
    "outputId": "38f97fe8-bea6-4d9a-9f9e-1f8a93e1ff64"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.8329994734773332\n",
      "0.999836342205372\n",
      "1.0\n",
      "0.9961614614171007\n",
      "0.9242389168997818\n",
      "0.897218189044216\n",
      "0.8509486271407842\n",
      "1.0\n",
      "0.9995352025414732\n",
      "0.5252197696550913\n",
      "0.49411139187334396\n",
      "1.0\n",
      "0.999910188930257\n",
      "1.0\n",
      "0.999836342205372\n",
      "1.0\n"
     ]
    }
   ],
   "source": [
    "precision_Breast, recall_Breast, thresholds_Breast = precision_recall_curve(score_true, score_pred_Breast)\n",
    "precision_Chest, recall_Chest, thresholds_Chest = precision_recall_curve(score_true, score_pred_Chest)\n",
    "precision_Oct, recall_Oct, thresholds_Oct = precision_recall_curve(score_true, score_pred_Oct)\n",
    "precision_Organa, recall_Organa, thresholds_Organa = precision_recall_curve(score_true, score_pred_Organa)\n",
    "precision_Organc, recall_Organc, thresholds_Organc = precision_recall_curve(score_true, score_pred_Organc)\n",
    "precision_Organs, recall_Organs, thresholds_Organs = precision_recall_curve(score_true, score_pred_Organs)\n",
    "precision_Pneum, recall_Pneum, thresholds_Pneum = precision_recall_curve(score_true, score_pred_Pneum)\n",
    "precision_Tissue, recall_Tissue, thresholds_Tissue = precision_recall_curve(score_true, score_pred_Tissue)\n",
    "precision_KMNIST, recall_KMNIST, thresholds_KMNIST = precision_recall_curve(score_true, score_pred_KMNIST)\n",
    "precision_QMNIST, recall_QMNIST, thresholds_QMNIST = precision_recall_curve(score_true, score_pred_QMNIST)\n",
    "precision_Omniglot, recall_Omniglot, thresholds_Omniglot = precision_recall_curve(score_true, score_pred_Omniglot)\n",
    "precision_Cifar10bw, recall_Cifar10bw, threshold_Cifar10bw = precision_recall_curve(score_true, score_pred_Cifar10bw)\n",
    "precision_NotMNIST, recall_NotMNIST, thresholds_NotMNIST = precision_recall_curve(score_true, score_pred_NotMNIST)\n",
    "precision_Gaussian, recall_Gaussian, thresholds_Gaussian = precision_recall_curve(score_true, score_pred_Gaussian)\n",
    "precision_Uniform, recall_Uniform, thresholds_Uniform = precision_recall_curve(score_true, score_pred_Uniform)\n",
    "\n",
    "auc_precision_recall_Breast = auc(recall_Breast, precision_Breast)\n",
    "auc_precision_recall_Chest = auc(recall_Chest, precision_Chest)\n",
    "auc_precision_recall_Oct = auc(recall_Oct, precision_Oct)\n",
    "auc_precision_recall_Organa = auc(recall_Organa, precision_Organa)\n",
    "auc_precision_recall_Organc = auc(recall_Organc, precision_Organc)\n",
    "auc_precision_recall_Organs = auc(recall_Organs, precision_Organs)\n",
    "auc_precision_recall_Pneum = auc(recall_Pneum, precision_Pneum)\n",
    "auc_precision_recall_Tissue = auc(recall_Tissue, precision_Tissue)\n",
    "auc_precision_recall_KMNIST = auc(recall_KMNIST, precision_KMNIST)\n",
    "auc_precision_recall_QMNIST = auc(recall_QMNIST, precision_QMNIST)\n",
    "auc_precision_recall_Omniglot = auc(recall_Omniglot, precision_Omniglot)\n",
    "auc_precision_recall_Cifar10bw = auc(recall_Cifar10bw, precision_Cifar10bw)\n",
    "auc_precision_recall_NotMNIST = auc(recall_NotMNIST, precision_NotMNIST)\n",
    "auc_precision_recall_Gaussian = auc(recall_Gaussian, precision_Gaussian)\n",
    "auc_precision_recall_Uniform = auc(recall_Uniform, precision_Uniform)\n",
    "\n",
    "print(auc_precision_recall_Breast)\n",
    "print(auc_precision_recall_Chest)\n",
    "print(auc_precision_recall_Oct)\n",
    "print(auc_precision_recall_Organa)\n",
    "print(auc_precision_recall_Organc)\n",
    "print(auc_precision_recall_Organs)\n",
    "print(auc_precision_recall_Pneum)\n",
    "print(auc_precision_recall_Tissue)\n",
    "print(auc_precision_recall_KMNIST)\n",
    "print(auc_precision_recall_QMNIST)\n",
    "print(auc_precision_recall_Omniglot)\n",
    "print(auc_precision_recall_Cifar10bw)\n",
    "print(auc_precision_recall_NotMNIST)\n",
    "print(auc_precision_recall_Gaussian)\n",
    "print(auc_precision_recall_Uniform)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1076,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 17,
     "status": "ok",
     "timestamp": 1694123491044,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "NESkWnxQR1-0",
    "outputId": "5c293cb5-b53d-4fb3-eca5-9c3bef08ac07"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.278\n",
      "0.0\n",
      "0.0\n",
      "0.006\n",
      "0.172\n",
      "0.116\n",
      "0.136\n",
      "0.0\n",
      "0.002\n",
      "0.998\n",
      "0.924\n",
      "0.0\n",
      "0.0\n",
      "0.0\n",
      "0.0\n",
      "0.0\n"
     ]
    }
   ],
   "source": [
    "def compute_fpr95(y_true, y_pred_probs):\n",
    "    fpr, tpr, thresholds = sklearn.metrics.roc_curve(y_true, y_pred_probs)\n",
    "    idx = np.abs(tpr - 0.95).argmin()\n",
    "    fpr95 = fpr[idx]\n",
    "    return fpr95\n",
    "\n",
    "# Example usage\n",
    "# Assuming you have y_true (true labels) and y_pred_probs (predicted probabilities)\n",
    "fpr95_score_Breast = compute_fpr95(score_true, score_pred_Breast)\n",
    "fpr95_score_Chest = compute_fpr95(score_true, score_pred_Chest)\n",
    "fpr95_score_Oct = compute_fpr95(score_true, score_pred_Oct)\n",
    "fpr95_score_Organa = compute_fpr95(score_true, score_pred_Organa)\n",
    "fpr95_score_Organc = compute_fpr95(score_true, score_pred_Organc)\n",
    "fpr95_score_Organs = compute_fpr95(score_true, score_pred_Organs)\n",
    "fpr95_score_Pneum = compute_fpr95(score_true, score_pred_Pneum)\n",
    "fpr95_score_Tissue = compute_fpr95(score_true, score_pred_Tissue)\n",
    "fpr95_score_KMNIST = compute_fpr95(score_true, score_pred_KMNIST)\n",
    "fpr95_score_QMNIST = compute_fpr95(score_true, score_pred_QMNIST)\n",
    "fpr95_score_Omniglot = compute_fpr95(score_true, score_pred_Omniglot)\n",
    "fpr95_score_NotMNIST = compute_fpr95(score_true, score_pred_NotMNIST)\n",
    "fpr95_score_Cifar10bw = compute_fpr95(score_true, score_pred_Cifar10bw)\n",
    "fpr95_score_Gaussian = compute_fpr95(score_true, score_pred_Gaussian)\n",
    "fpr95_score_Uniform = compute_fpr95(score_true, score_pred_Uniform)\n",
    "\n",
    "print(fpr95_score_Breast)\n",
    "print(fpr95_score_Chest)\n",
    "print(fpr95_score_Oct)\n",
    "print(fpr95_score_Organa)\n",
    "print(fpr95_score_Organc)\n",
    "print(fpr95_score_Organs)\n",
    "print(fpr95_score_Pneum)\n",
    "print(fpr95_score_Tissue)\n",
    "print(fpr95_score_KMNIST)\n",
    "print(fpr95_score_QMNIST)\n",
    "print(fpr95_score_Omniglot)\n",
    "print(fpr95_score_NotMNIST)\n",
    "print(fpr95_score_Cifar10bw)\n",
    "print(fpr95_score_Uniform)\n",
    "print(fpr95_score_Gaussian)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1076,
   "metadata": {
    "executionInfo": {
     "elapsed": 16,
     "status": "ok",
     "timestamp": 1694123491045,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6OgOveH0R2BF"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 1077,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 16,
     "status": "ok",
     "timestamp": 1694123491045,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ne3WwJ3iDJmu",
    "outputId": "2d6269ab-0ae6-4260-c083-415335151ae8"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.9471780040080169 0.013737374579823412\n",
      "0.89349619238477 0.04278027255607925\n",
      "0.7313129939879759 0.05429992848372509\n",
      "0.6373530581162324 0.04691403111570002\n",
      "0.6319768336673346 0.07643945699859421\n",
      "0.83064046492986 0.06460451004610498\n",
      "0.8206654909819643 0.06404052768526305\n",
      "0.8312460280561125 0.06386650935155687\n",
      "0.5854379318637275 0.060820976802374145\n",
      "0.6040701563126253 0.08591480009387842\n",
      "0.9500735551102213 0.009025108583268025\n",
      "0.9467801683366742 0.01541214512180387\n",
      "0.45097717034068113 0.051610479496459645\n",
      "0.7999598076152303 0.04022106751190043\n",
      "0.620590621242485 0.07957887261302038\n",
      "0.6145674709418838 0.08375242104611065\n",
      "0.6103612665330663 0.02375822592532537\n"
     ]
    }
   ],
   "source": [
    "print(np.mean(score_test_in), np.sqrt(np.cov(score_test_in)))\n",
    "print(np.mean(score_test_out_Breast), np.sqrt(np.cov(score_test_out_Breast)))\n",
    "print(np.mean(score_test_out_Chest), np.sqrt(np.cov(score_test_out_Chest)))\n",
    "print(np.mean(score_test_out_Oct), np.sqrt(np.cov(score_test_out_Oct)))\n",
    "print(np.mean(score_test_out_Organa), np.sqrt(np.cov(score_test_out_Organa)))\n",
    "print(np.mean(score_test_out_Organc), np.sqrt(np.cov(score_test_out_Organc)))\n",
    "print(np.mean(score_test_out_Organs), np.sqrt(np.cov(score_test_out_Organs)))\n",
    "print(np.mean(score_test_out_Pneum), np.sqrt(np.cov(score_test_out_Pneum)))\n",
    "print(np.mean(score_test_out_Tissue), np.sqrt(np.cov(score_test_out_Tissue)))\n",
    "print(np.mean(score_test_out_KMNIST), np.sqrt(np.cov(score_test_out_KMNIST)))\n",
    "print(np.mean(score_test_out_QMNIST), np.sqrt(np.cov(score_test_out_QMNIST)))\n",
    "print(np.mean(score_test_out_Omniglot), np.sqrt(np.cov(score_test_out_Omniglot)))\n",
    "print(np.mean(score_test_out_Cifar10bw), np.sqrt(np.cov(score_test_out_Cifar10bw)))\n",
    "print(np.mean(score_test_out_NotMNIST), np.sqrt(np.cov(score_test_out_NotMNIST)))\n",
    "print(np.mean(score_test_out_Gaussian), np.sqrt(np.cov(score_test_out_Gaussian)))\n",
    "print(np.mean(score_test_out_Uniform), np.sqrt(np.cov(score_test_out_Uniform)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1079,
   "metadata": {
    "executionInfo": {
     "elapsed": 12,
     "status": "ok",
     "timestamp": 1694123491046,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "KNUqlxZwebnF"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "executionInfo": {
     "elapsed": 15,
     "status": "aborted",
     "timestamp": 1694096883983,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "CgBZPC9Truem"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "authorship_tag": "ABX9TyOtpysuIkpsksm2+0FBUcw6",
   "machine_shape": "hm",
   "provenance": [
    {
     "file_id": "1Fp5qny4ygd5s_dco0cnOGx4MohZmAEiT",
     "timestamp": 1694095668052
    }
   ]
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
