{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 902,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2305,
     "status": "ok",
     "timestamp": 1694122497790,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Au3Fcvf9ONNZ",
    "outputId": "9e658041-b6a5-46df-ee48-6407af6f375f"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Drive already mounted at /content/gdrive; to attempt to forcibly remount, call drive.mount(\"/content/gdrive\", force_remount=True).\n"
     ]
    }
   ],
   "source": [
    "from google.colab import drive\n",
    "drive.mount('/content/gdrive')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 903,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4221,
     "status": "ok",
     "timestamp": 1694122502008,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "DmeCfBPTjxgJ",
    "outputId": "5d4285b1-411b-4aff-aa25-dc8ae94ffa8f"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: PIMS in /usr/local/lib/python3.10/dist-packages (0.6.1)\n",
      "Requirement already satisfied: imageio in /usr/local/lib/python3.10/dist-packages (from PIMS) (2.31.3)\n",
      "Requirement already satisfied: numpy>=1.19 in /usr/local/lib/python3.10/dist-packages (from PIMS) (1.23.5)\n",
      "Requirement already satisfied: slicerator>=0.9.8 in /usr/local/lib/python3.10/dist-packages (from PIMS) (1.1.0)\n",
      "Requirement already satisfied: pillow>=8.3.2 in /usr/local/lib/python3.10/dist-packages (from imageio->PIMS) (9.4.0)\n"
     ]
    }
   ],
   "source": [
    "pip install PIMS"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 905,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4634,
     "status": "ok",
     "timestamp": 1694122511369,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "vOZ-qtazj0pn",
    "outputId": "c011ae23-1f65-49bd-b9a0-2d7ef22985e6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: fastcluster in /usr/local/lib/python3.10/dist-packages (1.2.6)\n",
      "Requirement already satisfied: numpy>=1.9 in /usr/local/lib/python3.10/dist-packages (from fastcluster) (1.23.5)\n"
     ]
    }
   ],
   "source": [
    "pip install fastcluster"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 906,
   "metadata": {
    "executionInfo": {
     "elapsed": 20,
     "status": "ok",
     "timestamp": 1694122511370,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "UFN8FbHYOWnl"
   },
   "outputs": [],
   "source": [
    "import torch\n",
    "import numpy as np\n",
    "from torchvision import datasets\n",
    "import torchvision.transforms as transforms\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import torchvision\n",
    "import torch\n",
    "from torchvision import transforms\n",
    "\n",
    "plt.rcParams['axes.facecolor'] = 'white'\n",
    "plt.rcParams['figure.figsize'] = 9, 6"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 907,
   "metadata": {
    "executionInfo": {
     "elapsed": 19,
     "status": "ok",
     "timestamp": 1694122511370,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "KH8zgcDRj3zg"
   },
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "\n",
    "# importing relevant libraries\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import scipy as sp\n",
    "import matplotlib.pyplot as plt\n",
    "import sklearn\n",
    "from sklearn.ensemble import RandomForestClassifier, ExtraTreesClassifier\n",
    "from sklearn.preprocessing import OneHotEncoder, StandardScaler\n",
    "from sklearn.model_selection import cross_val_predict, StratifiedKFold\n",
    "from sklearn.metrics import roc_auc_score, average_precision_score, precision_recall_curve, auc#plot_precision_recall_curve\n",
    "from sklearn.datasets import make_classification\n",
    "from sklearn.preprocessing import MinMaxScaler\n",
    "from tqdm import tqdm\n",
    "from umap import UMAP\n",
    "from pynndescent import NNDescent\n",
    "from fastcluster import single\n",
    "from scipy.cluster.hierarchy import cut_tree, fcluster, dendrogram\n",
    "from scipy.spatial.distance import squareform\n",
    "from sklearn.tree import DecisionTreeClassifier, ExtraTreeClassifier\n",
    "from pims import ImageSequence\n",
    "from PIL import Image\n",
    "from scipy.spatial.distance import hamming\n",
    "import warnings\n",
    "warnings.filterwarnings('ignore')\n",
    "\n",
    "# turning off automatic plot showing, and setting style\n",
    "plt.style.use('bmh')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 908,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 19,
     "status": "ok",
     "timestamp": 1694122511370,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "8iNq7_xZ6WJK",
    "outputId": "0da98a88-2652-40d8-9974-a2f1edb43388"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cpu\n"
     ]
    }
   ],
   "source": [
    "if torch.cuda.is_available():\n",
    "    device = torch.device('cuda')\n",
    "else:\n",
    "    device = torch.device('cpu')\n",
    "\n",
    "print(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 909,
   "metadata": {
    "executionInfo": {
     "elapsed": 15,
     "status": "ok",
     "timestamp": 1694122511370,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "HrjCzoe8OWqH"
   },
   "outputs": [],
   "source": [
    "# define the NN architecture\n",
    "class ConvAutoencoder(nn.Module):\n",
    "    def __init__(self):\n",
    "        super(ConvAutoencoder, self).__init__()\n",
    "        ## encoder layers ##\n",
    "        # conv layer (depth from 1 --> 16), 3x3 kernels\n",
    "        self.conv1 = nn.Conv2d(1, 16, 3, padding=1)\n",
    "        # conv layer (depth from 16 --> 4), 3x3 kernels\n",
    "        self.conv2 = nn.Conv2d(16, 4, 3, padding=1)\n",
    "        # pooling layer to reduce x-y dims by two; kernel and stride of 2\n",
    "        self.pool = nn.MaxPool2d(2, 2)\n",
    "\n",
    "        ## decoder layers ##\n",
    "        ## a kernel of 2 and a stride of 2 will increase the spatial dims by 2\n",
    "        self.t_conv1 = nn.ConvTranspose2d(4, 16, 2, stride=2)\n",
    "        self.t_conv2 = nn.ConvTranspose2d(16, 1, 2, stride=2)\n",
    "\n",
    "\n",
    "    def forward(self, x):\n",
    "        ## encode ##\n",
    "        # add hidden layers with relu activation function\n",
    "        # and maxpooling after\n",
    "        x = F.relu(self.conv1(x))\n",
    "        x = self.pool(x)\n",
    "        # add second hidden layer\n",
    "        x = F.relu(self.conv2(x))\n",
    "        x = self.pool(x)  # compressed representation\n",
    "\n",
    "        ## decode ##\n",
    "        # add transpose conv layers, with relu activation function\n",
    "        x = F.relu(self.t_conv1(x))\n",
    "        # output layer (with sigmoid for scaling from 0 to 1)\n",
    "        x = F.sigmoid(self.t_conv2(x))\n",
    "\n",
    "        return x\n",
    "\n",
    "    def forward_encoder(self, x):\n",
    "        x = F.relu(self.conv1(x))\n",
    "        x = self.pool(x)\n",
    "        # add second hidden layer\n",
    "        x = F.relu(self.conv2(x))\n",
    "        x = self.pool(x)  # compressed representation\n",
    "\n",
    "        return x\n",
    "\n",
    "\n",
    "# Training function\n",
    "def train(model, train_loader, criterion, optimizer, num_epochs=10, online = False):\n",
    "    model.train()\n",
    "    for epoch in range(num_epochs):\n",
    "        running_loss = 0.0\n",
    "        if not online:\n",
    "            for images in train_loader:\n",
    "                noisy_images = images #+ torch.randn(images.size()) * 0.1  # Adding Gaussian noise\n",
    "                noisy_images = torchvision.transforms.Grayscale(num_output_channels=1)(noisy_images)\n",
    "                optimizer.zero_grad()\n",
    "                outputs = model(noisy_images)\n",
    "                loss = criterion(outputs, images)\n",
    "                loss.backward()\n",
    "                optimizer.step()\n",
    "                running_loss += loss.item()\n",
    "        else:\n",
    "            for images, _ in train_loader:\n",
    "                noisy_images = images #+ torch.randn(images.size()) * 0.1  # Adding Gaussian noise\n",
    "                noisy_images = torchvision.transforms.Grayscale(num_output_channels=1)(noisy_images)\n",
    "                optimizer.zero_grad()\n",
    "                outputs = model(noisy_images)\n",
    "                loss = criterion(outputs, images)\n",
    "                loss.backward()\n",
    "                optimizer.step()\n",
    "                running_loss += loss.item()\n",
    "        print(f\"Epoch [{epoch + 1}/{num_epochs}], Loss: {running_loss / len(train_loader)}\")\n",
    "\n",
    "# Data preprocessing\n",
    "transform = transforms.Compose([\n",
    "    transforms.ToTensor(),\n",
    "])\n",
    "\n",
    "# Initialize the model, criterion, and optimizer\n",
    "model = ConvAutoencoder()\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = torch.optim.Adam(model.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 910,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 516981,
     "status": "ok",
     "timestamp": 1694123028336,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Om9z7Bi4O-sW",
    "outputId": "f2f75376-381a-4da6-924f-25c2c61a40f8"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch [1/30], Loss: 0.03050988048577169\n",
      "Epoch [2/30], Loss: 0.015422411543974427\n",
      "Epoch [3/30], Loss: 0.014152704527589686\n",
      "Epoch [4/30], Loss: 0.01328139442867085\n",
      "Epoch [5/30], Loss: 0.012614572571634229\n",
      "Epoch [6/30], Loss: 0.012169025597104957\n",
      "Epoch [7/30], Loss: 0.011880669234467468\n",
      "Epoch [8/30], Loss: 0.01163484361062426\n",
      "Epoch [9/30], Loss: 0.01147218226496853\n",
      "Epoch [10/30], Loss: 0.011344013919334994\n",
      "Epoch [11/30], Loss: 0.011208372392149559\n",
      "Epoch [12/30], Loss: 0.011123872664906005\n",
      "Epoch [13/30], Loss: 0.011063962379522098\n",
      "Epoch [14/30], Loss: 0.011013341719097992\n",
      "Epoch [15/30], Loss: 0.01097821462343433\n",
      "Epoch [16/30], Loss: 0.01094517709989188\n",
      "Epoch [17/30], Loss: 0.010918215754181781\n",
      "Epoch [18/30], Loss: 0.010894274444325265\n",
      "Epoch [19/30], Loss: 0.010864289473496012\n",
      "Epoch [20/30], Loss: 0.010835678761463557\n",
      "Epoch [21/30], Loss: 0.010811659606741563\n",
      "Epoch [22/30], Loss: 0.010787183902403122\n",
      "Epoch [23/30], Loss: 0.01076234688660674\n",
      "Epoch [24/30], Loss: 0.010744142303390226\n",
      "Epoch [25/30], Loss: 0.010728512378310217\n",
      "Epoch [26/30], Loss: 0.01070939783237255\n",
      "Epoch [27/30], Loss: 0.01069227746749388\n",
      "Epoch [28/30], Loss: 0.010681142782303952\n",
      "Epoch [29/30], Loss: 0.010652797236077503\n",
      "Epoch [30/30], Loss: 0.010627869940571376\n"
     ]
    }
   ],
   "source": [
    "# Load CIFAR-10 data\n",
    "train_dataset = torchvision.datasets.FashionMNIST(root=\".FashionMNIST/train\", train=True, transform=transform, download=True)\n",
    "train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=64, shuffle=True, num_workers=4)\n",
    "\n",
    "# Training the model\n",
    "train(model, train_loader, criterion, optimizer, num_epochs=30, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 911,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 21582,
     "status": "ok",
     "timestamp": 1694123049900,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "bh3Zu2QWO-uq",
    "outputId": "9b2317bd-9957-4ce8-9cdc-d183da934b66"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'torchvision.datasets.mnist.FashionMNIST'>\n",
      "(60000, 1, 28, 28)\n",
      "(60000, 4, 7, 7)\n",
      "(60000,)\n"
     ]
    }
   ],
   "source": [
    "train_dataset = torchvision.datasets.FashionMNIST(root=\".FashionMNIST/train\", train=True, transform=transform, download=True)\n",
    "train_loader = torch.utils.data.DataLoader(train_dataset, batch_size = 60000, shuffle=True)\n",
    "\n",
    "print(type(train_dataset))\n",
    "\n",
    "for batch in train_loader:\n",
    "    img, labels = batch\n",
    "    #img = img.reshape(-1, 28*28)\n",
    "\n",
    "    # Generating output\n",
    "    out = model.forward(img)\n",
    "    latent_train = model.forward_encoder(img)\n",
    "\n",
    "X_train = img.detach().numpy()\n",
    "latent_train = latent_train.detach().numpy()\n",
    "y = labels.detach().numpy()\n",
    "print(X_train.shape)\n",
    "print(latent_train.shape)\n",
    "print(y.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 912,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1253,
     "status": "ok",
     "timestamp": 1694123051124,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ssO_Le6NP6HZ",
    "outputId": "e42e30ae-fffc-423e-a4fe-73850bde68e4"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(60000, 784)\n",
      "(60000, 196)\n",
      "0.015891340656571416\n",
      "0.1929747039709472\n"
     ]
    }
   ],
   "source": [
    "X_train = X_train.reshape(-1,28*28)\n",
    "latent_train = latent_train.reshape(-1,4*7*7)\n",
    "print(X_train.shape)\n",
    "print(latent_train.shape)\n",
    "print(np.mean(np.cov(X_train.T)))\n",
    "print(np.mean(np.cov(latent_train.T)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 915,
   "metadata": {
    "executionInfo": {
     "elapsed": 4,
     "status": "ok",
     "timestamp": 1694123093459,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "1a0drLZwEv9u"
   },
   "outputs": [],
   "source": [
    "# y = y[:2400]\n",
    "# latent_train = latent_train[:2400,:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 916,
   "metadata": {
    "executionInfo": {
     "elapsed": 7,
     "status": "ok",
     "timestamp": 1694123093462,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ZToawVOAkOGV"
   },
   "outputs": [],
   "source": [
    "# np.random.shuffle(y)\n",
    "# print(y)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "k3hp5R2cQCD9"
   },
   "source": [
    "# Tree Model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 917,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 38874,
     "status": "ok",
     "timestamp": 1694123132329,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "R3tnvjyuQKpq",
    "outputId": "46c51d4e-e504-4f44-9ed8-a2ad68a72d65"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Area under the ROC Curve: 0.9805470450617284\n"
     ]
    }
   ],
   "source": [
    "et = ExtraTreesClassifier(n_estimators=500, min_samples_leaf=100,\n",
    "                          max_features='sqrt', bootstrap=True, class_weight='balanced', n_jobs=-1)\n",
    "\n",
    "# et = RandomForestClassifier(n_estimators=500, min_samples_leaf=100,\n",
    "#                           max_features='sqrt', bootstrap=True, class_weight='balanced', n_jobs=-1)\n",
    "\n",
    "# validation instance\n",
    "skf = StratifiedKFold(n_splits=5, shuffle=True)\n",
    "\n",
    "# getting the model validation predictions\n",
    "preds = cross_val_predict(et, latent_train, y, cv=skf, method='predict_proba')\n",
    "\n",
    "# evaluating the model\n",
    "print('Area under the ROC Curve:', roc_auc_score(y, preds, multi_class='ovo'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 918,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 92
    },
    "executionInfo": {
     "elapsed": 10231,
     "status": "ok",
     "timestamp": 1694123142536,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "T2zHZflUQlOr",
    "outputId": "9bf9f7a1-8bbf-4b47-f7b3-06aa8ef26ba8"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<style>#sk-container-id-10 {color: black;background-color: white;}#sk-container-id-10 pre{padding: 0;}#sk-container-id-10 div.sk-toggleable {background-color: white;}#sk-container-id-10 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-10 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-10 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-10 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-10 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-10 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-10 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-10 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-10 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-10 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-10 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-10 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-10 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-10 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-10 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-10 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-10 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-10 div.sk-item {position: relative;z-index: 1;}#sk-container-id-10 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-10 div.sk-item::before, #sk-container-id-10 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-10 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-10 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-10 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-10 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-10 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-10 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-10 div.sk-label-container {text-align: center;}#sk-container-id-10 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-10 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-10\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>ExtraTreesClassifier(bootstrap=True, class_weight=&#x27;balanced&#x27;,\n",
       "                     min_samples_leaf=100, n_estimators=500, n_jobs=-1)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-10\" type=\"checkbox\" checked><label for=\"sk-estimator-id-10\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">ExtraTreesClassifier</label><div class=\"sk-toggleable__content\"><pre>ExtraTreesClassifier(bootstrap=True, class_weight=&#x27;balanced&#x27;,\n",
       "                     min_samples_leaf=100, n_estimators=500, n_jobs=-1)</pre></div></div></div></div></div>"
      ],
      "text/plain": [
       "ExtraTreesClassifier(bootstrap=True, class_weight='balanced',\n",
       "                     min_samples_leaf=100, n_estimators=500, n_jobs=-1)"
      ]
     },
     "execution_count": 918,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "et.fit(latent_train,y)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 919,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4806,
     "status": "ok",
     "timestamp": 1694123147339,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6tMnYzZ_VPZR",
    "outputId": "6dcce478-6d50-4f0d-9d0e-ffc118f3f870"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(60000, 500)\n",
      "[[ 39 450 280 ... 437  35 413]\n",
      " [428 189 294 ... 307 404  54]\n",
      " [113 337 408 ... 197 225  20]\n",
      " ...\n",
      " [ 43 206 325 ... 415 398  43]\n",
      " [453 134 135 ...  73 419 117]\n",
      " [228 314 438 ... 394 190 240]]\n",
      "0.9943195991983964\n",
      "9.242378192958237e-06\n"
     ]
    }
   ],
   "source": [
    "leaves_train = et.apply(latent_train)\n",
    "print(leaves_train.shape)\n",
    "print(leaves_train)\n",
    "\n",
    "distances_train = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_train[i,j] = hamming(leaves_train[i,:], leaves_train[j,:])\n",
    "\n",
    "score_train = sum(distances_train)/499\n",
    "\n",
    "print(np.mean(score_train))\n",
    "print(np.cov(score_train))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 920,
   "metadata": {
    "executionInfo": {
     "elapsed": 14,
     "status": "ok",
     "timestamp": 1694123147340,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Q55SNuDNhQQ1"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# torch.save(model.state_dict(), path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 921,
   "metadata": {
    "executionInfo": {
     "elapsed": 14,
     "status": "ok",
     "timestamp": 1694123147340,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "0hpY3jsdhQUb"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "U6SnpaEVWOQf"
   },
   "source": [
    "# Testing on ID Data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 922,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123147340,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "R6olj5rRmTpo"
   },
   "outputs": [],
   "source": [
    "#num_epoch = 30"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 923,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123147340,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BLgLZ7STVPbU"
   },
   "outputs": [],
   "source": [
    "# test_dataset_MNIST = torchvision.datasets.MNIST(root=\".MNIST/test\", train=False, transform=transform, download=True)\n",
    "# test_loader_MNIST = torch.utils.data.DataLoader(test_dataset_MNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_MNIST, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 924,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4965,
     "status": "ok",
     "timestamp": 1694123152292,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "zM65LrAhVPda",
    "outputId": "ad044cc6-bdbc-4fdc-b929-db7ad8f26a17"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 1, 28, 28)\n",
      "(10000, 4, 7, 7)\n",
      "(10000, 784)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "test_dataset_MNIST = torchvision.datasets.FashionMNIST(root=\".FashionMNIST/test\", train=False, transform=transform, download=True)\n",
    "test_loader_MNIST = torch.utils.data.DataLoader(test_dataset_MNIST, batch_size = 10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_MNIST:\n",
    "    img, _ = batch\n",
    "    #img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "    #img = img.reshape(-1, 28*28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test = latent_test.detach().numpy()\n",
    "X_test = img.detach().numpy()\n",
    "print(X_test.shape)\n",
    "print(latent_test.shape)\n",
    "X_test = X_test.reshape(-1,1*28*28)\n",
    "latent_test = latent_test.reshape(-1,4*7*7)\n",
    "print(X_test.shape)\n",
    "print(latent_test.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 925,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4014,
     "status": "ok",
     "timestamp": 1694123156284,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "5l77BQBXVPfP",
    "outputId": "1a108ead-5755-42ef-bfef-badc50598c4d"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[154 436 352 ... 374 325 394]\n",
      " [428 132 316 ... 263 418 464]\n",
      " [325 454 468 ... 450  46 418]\n",
      " ...\n",
      " [410 202 126 ... 137 404 158]\n",
      " [335 120  16 ... 169  66 166]\n",
      " [354 124  34 ... 150  66 159]]\n",
      "0.9676757194388776\n",
      "0.0002334108994135478\n"
     ]
    }
   ],
   "source": [
    "latent_test_in = latent_test\n",
    "\n",
    "leaves_test_in = et.apply(latent_test_in)\n",
    "print(leaves_test_in.shape)\n",
    "print(leaves_test_in)\n",
    "\n",
    "distances_test_in = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_in[i,j] = hamming(leaves_test_in[i,:], leaves_test_in[j,:])\n",
    "\n",
    "score_test_in = sum(distances_test_in)/499\n",
    "print(np.mean(score_test_in))\n",
    "print(np.cov(score_test_in))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "zKHeKNSXWZQr"
   },
   "source": [
    "# Testing on OOD Data"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "DQgAh1gaXxP6"
   },
   "source": [
    "## MNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 926,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123156284,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "DTO-dHR3hkcS"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 927,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1237,
     "status": "ok",
     "timestamp": 1694123157500,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "U6-VmvGdWLPA",
    "outputId": "20cfa6ab-03e1-4de9-c3d7-5a6d347db593"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "df_test_out = pd.read_csv('/content/gdrive/MyDrive/TOOD/datasets/mnist_test.csv')\n",
    "data_test_out = np.array(df_test_out)\n",
    "\n",
    "X_test_out = data_test_out[:, 1:785]/255\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Fashion = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Fashion, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 928,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2559,
     "status": "ok",
     "timestamp": 1694123160056,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "G-T51piGWLRU",
    "outputId": "8537747b-224f-46f9-9c14-a87f34620bb9"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 4, 7, 7)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Fashion = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Fashion:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Fashion = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Fashion.shape)\n",
    "latent_test_out_Fashion = latent_test_out_Fashion.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Fashion.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 929,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4535,
     "status": "ok",
     "timestamp": 1694123164588,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "RMYCE2rXYeqT",
    "outputId": "17b08547-39e0-439c-b39f-92a001259e5d"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[461 159  17 ...  77  66 418]\n",
      " [327 178   7 ... 110  80 463]\n",
      " [475 169  16 ... 104  50 418]\n",
      " ...\n",
      " [477 129  17 ... 111  50 463]\n",
      " [376 176 157 ... 169 433 418]\n",
      " [480 159  17 ...  77  50 463]]\n",
      "0.7290740681362725\n",
      "0.0029402485450191604\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Fashion = et.apply(latent_test_out_Fashion)\n",
    "\n",
    "print(leaves_test_out_Fashion.shape)\n",
    "print(leaves_test_out_Fashion)\n",
    "\n",
    "distances_test_out_Fashion = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Fashion[i,j] = hamming(leaves_test_out_Fashion[i,:], leaves_test_out_Fashion[j,:])\n",
    "\n",
    "score_test_out_Fashion = sum(distances_test_out_Fashion)/499\n",
    "\n",
    "print(np.mean(score_test_out_Fashion))\n",
    "print(np.cov(score_test_out_Fashion))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "hNZJuuwNO5AV"
   },
   "source": [
    "## BreastMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 930,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123164589,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "I8rDNw7QO6U5"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 931,
   "metadata": {
    "executionInfo": {
     "elapsed": 21,
     "status": "ok",
     "timestamp": 1694123164589,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "TMX1QtM7O6cF"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/breastmnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['train_images'].shape\n",
    "X_test_out = df['train_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_ChestMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 932,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 20,
     "status": "ok",
     "timestamp": 1694123164589,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "5_rUSplcO6eF",
    "outputId": "023a6c57-a724-4dc0-f7ba-99e7d6b8dbe2"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "546\n",
      "(546, 4, 7, 7)\n",
      "(546, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['train_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_BreastMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_BreastMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Breast = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Breast.shape)\n",
    "latent_test_out_Breast = latent_test_out_Breast.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Breast.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 933,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4706,
     "status": "ok",
     "timestamp": 1694123169276,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "XJ8p4wDAO6f4",
    "outputId": "bb56fb6a-4cab-441e-ef4c-86d507025a0b"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(546, 500)\n",
      "[[341 336 145 ... 204 225 298]\n",
      " [  6 336 164 ... 204  83 298]\n",
      " [  6 254 164 ... 196  83 290]\n",
      " ...\n",
      " [  6 254 164 ... 215 116 297]\n",
      " [  6 254 164 ... 210 116 298]\n",
      " [180 253 177 ... 218 164 297]]\n",
      "0.757487871743487\n",
      "0.003992812935734875\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Breast = et.apply(latent_test_out_Breast)\n",
    "\n",
    "print(leaves_test_out_Breast.shape)\n",
    "print(leaves_test_out_Breast)\n",
    "\n",
    "distances_test_out_Breast = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Breast[i,j] = hamming(leaves_test_out_Breast[i,:], leaves_test_out_Breast[j,:])\n",
    "\n",
    "score_test_out_Breast = sum(distances_test_out_Breast)/499\n",
    "\n",
    "print(np.mean(score_test_out_Breast))\n",
    "print(np.cov(score_test_out_Breast))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "1vkCzIAMy5Yi"
   },
   "source": [
    "## ChestMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 934,
   "metadata": {
    "executionInfo": {
     "elapsed": 11,
     "status": "ok",
     "timestamp": 1694123169277,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "-I7QZNVUhnpI"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 935,
   "metadata": {
    "executionInfo": {
     "elapsed": 10,
     "status": "ok",
     "timestamp": 1694123169277,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "3Nh3znXBv1za"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/chestmnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_ChestMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 936,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 7160,
     "status": "ok",
     "timestamp": 1694123176427,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "FFfdi--zv12B",
    "outputId": "34f570ca-43a8-42e4-b5cf-2c259a25e4af"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "22433\n",
      "(22433, 4, 7, 7)\n",
      "(22433, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_ChestMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Chest = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Chest.shape)\n",
    "latent_test_out_Chest = latent_test_out_Chest.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Chest.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 937,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4472,
     "status": "ok",
     "timestamp": 1694123180873,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "hLfKbVMzzxUi",
    "outputId": "d38489a1-8407-4a8f-bb4d-1dd83390f971"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(22433, 500)\n",
      "[[  6 101 178 ... 194 134 290]\n",
      " [  6 336 177 ... 244 139 290]\n",
      " [  6 101 177 ... 189 163 290]\n",
      " ...\n",
      " [  6 336 177 ... 244 208 290]\n",
      " [  6 101 327 ... 252 208 290]\n",
      " [  6 336 178 ... 194 164 290]]\n",
      "0.7052959839679358\n",
      "0.0061317927309174165\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Chest = et.apply(latent_test_out_Chest)\n",
    "\n",
    "print(leaves_test_out_Chest.shape)\n",
    "print(leaves_test_out_Chest)\n",
    "\n",
    "distances_test_out_Chest = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Chest[i,j] = hamming(leaves_test_out_Chest[i,:], leaves_test_out_Chest[j,:])\n",
    "\n",
    "score_test_out_Chest = sum(distances_test_out_Chest)/499\n",
    "\n",
    "print(np.mean(score_test_out_Chest))\n",
    "print(np.cov(score_test_out_Chest))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "Kuwv43MpPUjD"
   },
   "source": [
    "## OctMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 938,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123180874,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "MI5QlskOPWn1"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 939,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123180874,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "xIQbJtWjPWp8"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/octmnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_ChestMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_ChestMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 940,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 291,
     "status": "ok",
     "timestamp": 1694123181143,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "KKOyE9byPWr-",
    "outputId": "206fe657-d899-4487-91b8-9edec9167c55"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1000\n",
      "(1000, 4, 7, 7)\n",
      "(1000, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_OctMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_OctMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Oct = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Oct.shape)\n",
    "latent_test_out_Oct = latent_test_out_Oct.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Oct.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 941,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4331,
     "status": "ok",
     "timestamp": 1694123185470,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "yzjA0YdpPWtk",
    "outputId": "5715442e-753f-41b2-d5bb-f061a194ce42"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(1000, 500)\n",
      "[[  6 336 164 ... 193 116 298]\n",
      " [  6  43 145 ... 108 201 298]\n",
      " [  6  50 157 ...  19 201 298]\n",
      " ...\n",
      " [  6 284 168 ... 263 439  25]\n",
      " [  6  43 157 ...   7 208 298]\n",
      " [  6 254 164 ... 193 422 298]]\n",
      "0.7772529378757516\n",
      "0.0017965739424413076\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Oct = et.apply(latent_test_out_Oct)\n",
    "\n",
    "print(leaves_test_out_Oct.shape)\n",
    "print(leaves_test_out_Oct)\n",
    "\n",
    "distances_test_out_Oct = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Oct[i,j] = hamming(leaves_test_out_Oct[i,:], leaves_test_out_Oct[j,:])\n",
    "\n",
    "score_test_out_Oct = sum(distances_test_out_Oct)/499\n",
    "\n",
    "print(np.mean(score_test_out_Oct))\n",
    "print(np.cov(score_test_out_Oct))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "_Tguoeb3Nosv"
   },
   "source": [
    "## PneumMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 942,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123185470,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "yhageUDChpGt"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 943,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123185470,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "SJN2w-zVzxWm"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/pneumoniamnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['train_images'].shape\n",
    "X_test_out = df['train_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Pneum = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Pneum, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 944,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2276,
     "status": "ok",
     "timestamp": 1694123187734,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "zmGFQYZvNtiL",
    "outputId": "6d6c3150-53e9-47bd-f1de-84d85b05dca8"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "4708\n",
      "(4708, 4, 7, 7)\n",
      "(4708, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['train_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Pneum = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Pneum:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Pneum = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Pneum.shape)\n",
    "latent_test_out_Pneum = latent_test_out_Pneum.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Pneum.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 945,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4300,
     "status": "ok",
     "timestamp": 1694123192026,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "9SuNE4aSNt7b",
    "outputId": "033657a3-a437-402b-bf28-90e5ef8412d6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(4708, 500)\n",
      "[[  6 253 177 ... 225 139 290]\n",
      " [  6 253 177 ... 193 139 290]\n",
      " [  6 253 177 ... 225 153 290]\n",
      " ...\n",
      " [  6 253 177 ... 225 121 290]\n",
      " [  6 253 177 ... 215 151 290]\n",
      " [  6 253 177 ... 215 139 290]]\n",
      "0.511020889779559\n",
      "0.004233655245979071\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Pneum = et.apply(latent_test_out_Pneum)\n",
    "\n",
    "print(leaves_test_out_Pneum.shape)\n",
    "print(leaves_test_out_Pneum)\n",
    "\n",
    "distances_test_out_Pneum = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Pneum[i,j] = hamming(leaves_test_out_Pneum[i,:], leaves_test_out_Pneum[j,:])\n",
    "\n",
    "score_test_out_Pneum = sum(distances_test_out_Pneum)/499\n",
    "\n",
    "print(np.mean(score_test_out_Pneum))\n",
    "print(np.cov(score_test_out_Pneum))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "o1iY4vTXPlN-"
   },
   "source": [
    "## OrganaMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 946,
   "metadata": {
    "executionInfo": {
     "elapsed": 24,
     "status": "ok",
     "timestamp": 1694123192027,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Eg8cWRsQPmdX"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 947,
   "metadata": {
    "executionInfo": {
     "elapsed": 741,
     "status": "ok",
     "timestamp": 1694123192746,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "sQSXQXVxPmf6"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/organamnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Organc, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 948,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 6002,
     "status": "ok",
     "timestamp": 1694123198743,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "-hl_Di8dPmhQ",
    "outputId": "0ef811a5-b18d-4df1-bc29-534b01f54492"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "17778\n",
      "(17778, 4, 7, 7)\n",
      "(17778, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Organa = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Organa:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Organa = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Organa.shape)\n",
    "latent_test_out_Organa = latent_test_out_Organa.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Organa.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 949,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4705,
     "status": "ok",
     "timestamp": 1694123203436,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QTVnysAIPmjU",
    "outputId": "7842769b-cb0b-4cf6-fdf8-81444d58f068"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(17778, 500)\n",
      "[[130 336 331 ... 222 195 327]\n",
      " [  6 253 183 ... 189 139 290]\n",
      " [260 322 442 ... 287 235 257]\n",
      " ...\n",
      " [  6 253 172 ... 222 153 290]\n",
      " [ 70 264 144 ... 210 273 312]\n",
      " [  6 253 177 ... 215 209 290]]\n",
      "0.8572637274549102\n",
      "0.007295778112004953\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Organa = et.apply(latent_test_out_Organa)\n",
    "\n",
    "print(leaves_test_out_Organa.shape)\n",
    "print(leaves_test_out_Organa)\n",
    "\n",
    "distances_test_out_Organa = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Organa[i,j] = hamming(leaves_test_out_Organa[i,:], leaves_test_out_Organa[j,:])\n",
    "\n",
    "score_test_out_Organa = sum(distances_test_out_Organa)/499\n",
    "\n",
    "print(np.mean(score_test_out_Organa))\n",
    "print(np.cov(score_test_out_Organa))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "UEKwndGfCmv6"
   },
   "source": [
    "## OrgancMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 950,
   "metadata": {
    "executionInfo": {
     "elapsed": 14,
     "status": "ok",
     "timestamp": 1694123203437,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "J1GLB1jDh3uE"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 951,
   "metadata": {
    "executionInfo": {
     "elapsed": 13,
     "status": "ok",
     "timestamp": 1694123203437,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6OlXP64YNuYF"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/organcmnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Organc, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 952,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 3393,
     "status": "ok",
     "timestamp": 1694123206817,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "GneANgXlNuoo",
    "outputId": "17ed4021-db9d-4d31-bbe3-ce936e6a14ab"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "8268\n",
      "(8268, 4, 7, 7)\n",
      "(8268, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Organc:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Organc = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Organc.shape)\n",
    "latent_test_out_Organc = latent_test_out_Organc.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Organc.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 953,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4264,
     "status": "ok",
     "timestamp": 1694123211070,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "poQYWGAOC5gL",
    "outputId": "29607832-7ad7-448e-c2f4-ad6fe24bcc68"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(8268, 500)\n",
      "[[  6 253 172 ... 225 164 290]\n",
      " [  6 336 362 ... 215 164 303]\n",
      " [466 391 177 ... 469 121 428]\n",
      " ...\n",
      " [  6 254 177 ... 244 127 290]\n",
      " [  6 253 333 ... 215 195 290]\n",
      " [ 42 336 188 ... 215 272 327]]\n",
      "0.8289275511022047\n",
      "0.008034913619194667\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Organc = et.apply(latent_test_out_Organc)\n",
    "\n",
    "print(leaves_test_out_Organc.shape)\n",
    "print(leaves_test_out_Organc)\n",
    "\n",
    "distances_test_out_Organc = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Organc[i,j] = hamming(leaves_test_out_Organc[i,:], leaves_test_out_Organc[j,:])\n",
    "\n",
    "score_test_out_Organc = sum(distances_test_out_Organc)/499\n",
    "\n",
    "print(np.mean(score_test_out_Organc))\n",
    "print(np.cov(score_test_out_Organc))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "S9qWBt2uP5Iq"
   },
   "source": [
    "## OrgansMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 954,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123211071,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "hUVdNi9sP6ma"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 955,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123211071,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "fdtvZMXhP6od"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/organsmnist.npz')\n",
    "#X_test_out = df['train_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Organc = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Organc, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 956,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 3380,
     "status": "ok",
     "timestamp": 1694123214430,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "RhHM9LdQP6qW",
    "outputId": "c4be8943-ca90-4fa6-ab09-028a941e3bc6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "8829\n",
      "(8829, 4, 7, 7)\n",
      "(8829, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Organs = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Organs:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Organs = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Organs.shape)\n",
    "latent_test_out_Organs = latent_test_out_Organs.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Organs.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 957,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4507,
     "status": "ok",
     "timestamp": 1694123218935,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "0SJuP7e4P6sI",
    "outputId": "00eed695-d6b1-42fa-9dc4-f627b66d3093"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(8829, 500)\n",
      "[[  6 253 177 ... 244 164 290]\n",
      " [  6 336 172 ... 215 195 315]\n",
      " [  6 254 177 ... 193 121 290]\n",
      " ...\n",
      " [  6 222 426 ... 245 201 315]\n",
      " [ 44 254 336 ... 210 163 290]\n",
      " [480 128 157 ... 158 351 441]]\n",
      "0.8284305571142286\n",
      "0.008022785498374166\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Organs = et.apply(latent_test_out_Organs)\n",
    "\n",
    "print(leaves_test_out_Organs.shape)\n",
    "print(leaves_test_out_Organs)\n",
    "\n",
    "distances_test_out_Organs = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Organs[i,j] = hamming(leaves_test_out_Organs[i,:], leaves_test_out_Organs[j,:])\n",
    "\n",
    "score_test_out_Organs = sum(distances_test_out_Organs)/499\n",
    "\n",
    "print(np.mean(score_test_out_Organs))\n",
    "print(np.cov(score_test_out_Organs))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "PK_cY3XVDxlQ"
   },
   "source": [
    "## TissueMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 958,
   "metadata": {
    "executionInfo": {
     "elapsed": 12,
     "status": "ok",
     "timestamp": 1694123218935,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "rXhtk9Mah8mR"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 959,
   "metadata": {
    "executionInfo": {
     "elapsed": 1229,
     "status": "ok",
     "timestamp": 1694123220152,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "ViCtSF5iC5ie"
   },
   "outputs": [],
   "source": [
    "df = np.load('/content/gdrive/MyDrive/TOOD/datasets/tissuemnist.npz')\n",
    "#X_test_out = df['test_images']/255\n",
    "[size, _, _] = df['test_images'].shape\n",
    "X_test_out = df['test_images'].reshape((size, 784))/255\n",
    "\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "\n",
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_Tissue = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Tissue, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 960,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 14380,
     "status": "ok",
     "timestamp": 1694123234529,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "iSIHWqqOC5kT",
    "outputId": "2f1eed2a-a324-4995-b8ac-1b64b39f8e82"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "47280\n",
      "(47280, 4, 7, 7)\n",
      "(47280, 196)\n"
     ]
    }
   ],
   "source": [
    "[size, _, _] = df['test_images'].shape\n",
    "print(size)\n",
    "\n",
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader_Tissue = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=size, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Tissue:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_Tissue = latent_test_out.detach().numpy()\n",
    "#latent_test_out = latent_test_out[0,:,:]\n",
    "print(latent_test_out_Tissue.shape)\n",
    "latent_test_out_Tissue = latent_test_out_Tissue.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Tissue.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 961,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5246,
     "status": "ok",
     "timestamp": 1694123239748,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "IUQ3nT57Egcv",
    "outputId": "8f982701-c2b7-4742-9c69-3f0170ffe752"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(47280, 500)\n",
      "[[466  44 133 ...  19 232  25]\n",
      " [  5  46  22 ...  19 204  25]\n",
      " [  6  44   6 ...  19 101  25]\n",
      " ...\n",
      " [  5  47  99 ... 193 219 325]\n",
      " [  6  98 145 ... 467 201  25]\n",
      " [358  61 157 ... 108 422 425]]\n",
      "0.8148208737474949\n",
      "0.0017425242165510766\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Tissue = et.apply(latent_test_out_Tissue)\n",
    "\n",
    "print(leaves_test_out_Tissue.shape)\n",
    "print(leaves_test_out_Tissue)\n",
    "\n",
    "distances_test_out_Tissue = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Tissue[i,j] = hamming(leaves_test_out_Tissue[i,:], leaves_test_out_Tissue[j,:])\n",
    "\n",
    "score_test_out_Tissue = sum(distances_test_out_Tissue)/499\n",
    "\n",
    "print(np.mean(score_test_out_Tissue))\n",
    "print(np.cov(score_test_out_Tissue))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "V9pDbbT2Q9xv"
   },
   "source": [
    "## KMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 962,
   "metadata": {
    "executionInfo": {
     "elapsed": 25,
     "status": "ok",
     "timestamp": 1694123239749,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "e7-UM77Fh-w-"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 963,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123239749,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "4BiRKanXxvFv"
   },
   "outputs": [],
   "source": [
    "# test_dataset_KMNIST = torchvision.datasets.KMNIST(root=\"./data\", train=False, transform=transform, download=True)\n",
    "# test_loader_KMNIST = torch.utils.data.DataLoader(test_dataset_KMNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_KMNIST, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 964,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5102,
     "status": "ok",
     "timestamp": 1694123244828,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "IrDPmFlTxvH4",
    "outputId": "e60d1a03-abf6-4aba-eb0d-1db2f7fadc6d"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_KMNIST = torchvision.datasets.KMNIST(root='./data', train=False, download=True, transform=transform)\n",
    "test_loader_KMNIST = torch.utils.data.DataLoader(test_dataset_KMNIST, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_KMNIST:\n",
    "    img, _ = batch\n",
    "    #img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_KMNIST = latent_test_out.detach().numpy()\n",
    "latent_test_out_KMNIST = latent_test_out_KMNIST.reshape(-1,4*7*7)\n",
    "print(latent_test_out_KMNIST.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 965,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4442,
     "status": "ok",
     "timestamp": 1694123249248,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "WqFrdnepRkI7",
    "outputId": "415d11ad-0dbe-4914-8c9d-a8d9fe0556be"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[461 467 157 ... 111  80 444]\n",
      " [479 467 157 ...  77 331 464]\n",
      " [477 134 468 ... 470 426 464]\n",
      " ...\n",
      " [477 344 317 ... 162 419 441]\n",
      " [359 134 468 ...  95 439 464]\n",
      " [313 129 464 ... 457 453 448]]\n",
      "0.8934494589178358\n",
      "0.0007977316696098843\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_KMNIST = et.apply(latent_test_out_KMNIST)\n",
    "\n",
    "print(leaves_test_out_KMNIST.shape)\n",
    "print(leaves_test_out_KMNIST)\n",
    "\n",
    "distances_test_out_KMNIST = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_KMNIST[i,j] = hamming(leaves_test_out_KMNIST[i,:], leaves_test_out_KMNIST[j,:])\n",
    "\n",
    "score_test_out_KMNIST = sum(distances_test_out_KMNIST)/499\n",
    "\n",
    "print(np.mean(score_test_out_KMNIST))\n",
    "print(np.cov(score_test_out_KMNIST))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "brj6eAE_SJn2"
   },
   "source": [
    "## QMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 966,
   "metadata": {
    "executionInfo": {
     "elapsed": 28,
     "status": "ok",
     "timestamp": 1694123249252,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "dIaTRR3kif-b"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 967,
   "metadata": {
    "executionInfo": {
     "elapsed": 27,
     "status": "ok",
     "timestamp": 1694123249252,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "1iG0aHi7xvJH"
   },
   "outputs": [],
   "source": [
    "# test_dataset_QMNIST = torchvision.datasets.QMNIST(root=\"./data\", train=False, transform=transform, download=True)\n",
    "# test_loader_QMNIST = torch.utils.data.DataLoader(test_dataset_QMNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_QMNIST, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 968,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 44549,
     "status": "ok",
     "timestamp": 1694123293776,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "gXmIqYEnSMZs",
    "outputId": "e0838eab-2b5d-429e-aad0-df1282ffa19b"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_QMNIST = torchvision.datasets.QMNIST(root='./data', train=False, download=True, transform=transform)\n",
    "test_loader_QMNIST = torch.utils.data.DataLoader(test_dataset_QMNIST, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_QMNIST:\n",
    "    img, _ = batch\n",
    "    #img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_QMNIST = latent_test_out.detach().numpy()\n",
    "latent_test_out_QMNIST = latent_test_out_QMNIST.reshape(-1,4*7*7)\n",
    "print(latent_test_out_QMNIST.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 969,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 5045,
     "status": "ok",
     "timestamp": 1694123298797,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "OW51VvQQSMbw",
    "outputId": "4d1ef0b1-1ebb-4291-ff27-f8fab18a6491"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[327 159  17 ... 168  50 463]\n",
      " [480 134  17 ...  81  67 452]\n",
      " [454  75 442 ...  77  66 418]\n",
      " ...\n",
      " [316 129 157 ... 168  66 462]\n",
      " [479 177  17 ... 169 427 463]\n",
      " [479 133  17 ... 111  67 462]]\n",
      "0.7437405210420841\n",
      "0.0024396926879473664\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_QMNIST = et.apply(latent_test_out_QMNIST)\n",
    "\n",
    "print(leaves_test_out_QMNIST.shape)\n",
    "print(leaves_test_out_QMNIST)\n",
    "\n",
    "distances_test_out_QMNIST = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_QMNIST[i,j] = hamming(leaves_test_out_QMNIST[i,:], leaves_test_out_QMNIST[j,:])\n",
    "\n",
    "score_test_out_QMNIST = sum(distances_test_out_QMNIST)/499\n",
    "\n",
    "print(np.mean(score_test_out_QMNIST))\n",
    "print(np.cov(score_test_out_QMNIST))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "iKdP-64sRyQ8"
   },
   "source": [
    "## Omniglot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 970,
   "metadata": {
    "executionInfo": {
     "elapsed": 18,
     "status": "ok",
     "timestamp": 1694123298797,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "GNAQF4F4R9JQ"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 971,
   "metadata": {
    "executionInfo": {
     "elapsed": 17,
     "status": "ok",
     "timestamp": 1694123298797,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "bQdeByYMSFYz"
   },
   "outputs": [],
   "source": [
    "# test_dataset_Omniglot = torchvision.datasets.Omniglot(root='./data', download=True, transform=transform)\n",
    "# test_loader_Omniglot = torch.utils.data.DataLoader(test_dataset_QMNIST, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Omniglot, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 972,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 14513,
     "status": "ok",
     "timestamp": 1694123313293,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "rOznxhcjSMd0",
    "outputId": "bbf8f8f7-413a-4e3d-80ae-1ef8b3e30d18"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Files already downloaded and verified\n",
      "(19280, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_Omniglot = torchvision.datasets.Omniglot(root='./data', download=True, transform=transform)\n",
    "\n",
    "# Creating Dataloaders from the\n",
    "# training and testing dataset\n",
    "test_loader_Omniglot = torch.utils.data.DataLoader(test_dataset_Omniglot, batch_size=32460, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Omniglot:\n",
    "    img, _ = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Omniglot = latent_test_out.detach().numpy()\n",
    "latent_test_out_Omniglot = latent_test_out_Omniglot.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Omniglot.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 973,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4349,
     "status": "ok",
     "timestamp": 1694123317618,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "2l0MVvcaSMfp",
    "outputId": "8f7a6d21-fcac-4108-fea7-31199f2ba966"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(19280, 500)\n",
      "[[  6 253 291 ... 224 139 298]\n",
      " [466 253 183 ... 224 153 290]\n",
      " [  6 336 183 ... 225 153 327]\n",
      " ...\n",
      " [  6 253 178 ... 469 153 290]\n",
      " [450 253 177 ... 263 139 298]\n",
      " [  6 253 177 ... 224 139 298]]\n",
      "0.5652618677354709\n",
      "0.004868972242066929\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Omniglot = et.apply(latent_test_out_Omniglot)\n",
    "\n",
    "print(leaves_test_out_Omniglot.shape)\n",
    "print(leaves_test_out_Omniglot)\n",
    "\n",
    "distances_test_out_Omniglot = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Omniglot[i,j] = hamming(leaves_test_out_Omniglot[i,:], leaves_test_out_Omniglot[j,:])\n",
    "\n",
    "score_test_out_Omniglot = sum(distances_test_out_Omniglot)/499\n",
    "\n",
    "print(np.mean(score_test_out_Omniglot))\n",
    "print(np.cov(score_test_out_Omniglot))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "u9OZcvTSXkPh"
   },
   "source": [
    "## Cifar10bw"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 974,
   "metadata": {
    "executionInfo": {
     "elapsed": 23,
     "status": "ok",
     "timestamp": 1694123317619,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QfMu7Z3kXol1"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 975,
   "metadata": {
    "executionInfo": {
     "elapsed": 20,
     "status": "ok",
     "timestamp": 1694123317619,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "Ej9JmeDhX0NG"
   },
   "outputs": [],
   "source": [
    "# test_dataset_Cifar10bw = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)\n",
    "# test_loader_Cifar10bw = torch.utils.data.DataLoader(test_dataset_Cifar10bw, batch_size = 64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_Cifar10bw, criterion, optimizer, num_epochs=num_epoch, online=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 976,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 6661,
     "status": "ok",
     "timestamp": 1694123324260,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "96LUcE1kXon3",
    "outputId": "279826eb-fdec-4189-8598-cd733258b4c0"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Files already downloaded and verified\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "transform = transforms.Compose(\n",
    "    [transforms.Resize((28, 28)),  # Resize images to match the size of MNIST\n",
    "     transforms.ToTensor()])\n",
    "\n",
    "test_dataset_Cifar10bw = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)\n",
    "\n",
    "# Creating Dataloaders from the\n",
    "# training and testing dataset\n",
    "test_loader_Cifar10bw = torch.utils.data.DataLoader(test_dataset_Cifar10bw, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_Cifar10bw:\n",
    "    img, _ = batch\n",
    "    img = torchvision.transforms.Grayscale(num_output_channels=1)(img)\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Cifar10bw = latent_test_out.detach().numpy()\n",
    "latent_test_out_Cifar10bw = latent_test_out_Cifar10bw.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Cifar10bw.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 977,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4521,
     "status": "ok",
     "timestamp": 1694123328767,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "-9ekzdVoYJIH",
    "outputId": "48909e86-2071-4c95-ff8f-501447d4caf7"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[466 253 183 ... 215 163 290]\n",
      " [  6 336 164 ... 210 127 290]\n",
      " [  6 253 183 ... 193 139 298]\n",
      " ...\n",
      " [  6 101 175 ... 210 163 290]\n",
      " [  6 336 177 ... 193 153 298]\n",
      " [446 273 178 ... 192 203 244]]\n",
      "0.752224496993988\n",
      "0.006190605020545569\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Cifar10bw = et.apply(latent_test_out_Cifar10bw)\n",
    "\n",
    "print(leaves_test_out_Cifar10bw.shape)\n",
    "print(leaves_test_out_Cifar10bw)\n",
    "\n",
    "distances_test_out_Cifar10bw = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Cifar10bw[i,j] = hamming(leaves_test_out_Cifar10bw[i,:], leaves_test_out_Cifar10bw[j,:])\n",
    "\n",
    "score_test_out_Cifar10bw = sum(distances_test_out_Cifar10bw)/499\n",
    "\n",
    "print(np.mean(score_test_out_Cifar10bw))\n",
    "print(np.cov(score_test_out_Cifar10bw))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "WDCNJ2thdelj"
   },
   "source": [
    "## NotMNIST"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 978,
   "metadata": {
    "executionInfo": {
     "elapsed": 25,
     "status": "ok",
     "timestamp": 1694123328768,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "hhMEPlqad6cl"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 979,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2447,
     "status": "ok",
     "timestamp": 1694123331192,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "7HUmXsizdh0T",
    "outputId": "1dc3a976-861c-4a62-9ac7-c16debeff7b7"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(500, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "from pims import ImageSequence\n",
    "from PIL import Image\n",
    "\n",
    "images_A = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/A/*.png')\n",
    "images_B = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/B/*.png')\n",
    "images_C = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/C/*.png')\n",
    "images_D = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/D/*.png')\n",
    "images_E = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/E/*.png')\n",
    "images_F = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/F/*.png')\n",
    "images_G = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/G/*.png')\n",
    "images_H = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/H/*.png')\n",
    "images_I = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/I/*.png')\n",
    "images_J = ImageSequence('/content/gdrive/MyDrive/TOOD/datasets/NotMNIST_small/J/*.png')\n",
    "\n",
    "X_data_A = np.zeros((50, 28**2))\n",
    "X_data_B = np.zeros((50, 28**2))\n",
    "X_data_C = np.zeros((50, 28**2))\n",
    "X_data_D = np.zeros((50, 28**2))\n",
    "X_data_E = np.zeros((50, 28**2))\n",
    "X_data_F = np.zeros((50, 28**2))\n",
    "X_data_G = np.zeros((50, 28**2))\n",
    "X_data_H = np.zeros((50, 28**2))\n",
    "X_data_I = np.zeros((50, 28**2))\n",
    "X_data_J = np.zeros((50, 28**2))\n",
    "\n",
    "for i in range(50):\n",
    "    X_data_A[i,:] = np.reshape(np.array(images_A[i]), (1,28**2))/255\n",
    "    X_data_B[i,:] = np.reshape(np.array(images_B[i]), (1,28**2))/255\n",
    "    X_data_C[i,:] = np.reshape(np.array(images_C[i]), (1,28**2))/255\n",
    "    X_data_D[i,:] = np.reshape(np.array(images_D[i]), (1,28**2))/255\n",
    "    X_data_E[i,:] = np.reshape(np.array(images_E[i]), (1,28**2))/255\n",
    "    X_data_F[i,:] = np.reshape(np.array(images_F[i]), (1,28**2))/255\n",
    "    X_data_G[i,:] = np.reshape(np.array(images_G[i]), (1,28**2))/255\n",
    "    X_data_H[i,:] = np.reshape(np.array(images_H[i]), (1,28**2))/255\n",
    "    X_data_I[i,:] = np.reshape(np.array(images_I[i]), (1,28**2))/255\n",
    "    X_data_J[i,:] = np.reshape(np.array(images_J[i]), (1,28**2))/255\n",
    "\n",
    "\n",
    "X_test_out = np.vstack([X_data_A, X_data_B, X_data_C, X_data_D, X_data_E, X_data_F, X_data_G, X_data_H, X_data_I, X_data_J])\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 980,
   "metadata": {
    "executionInfo": {
     "elapsed": 2,
     "status": "ok",
     "timestamp": 1694123331192,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QtoumAYBdh4P"
   },
   "outputs": [],
   "source": [
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# test_loader_NotMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, test_loader_NotMNIST, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 981,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 14872,
     "status": "ok",
     "timestamp": 1694123346062,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "vqZPvS-3dh7k",
    "outputId": "74bb38eb-e527-40ad-c7a3-1f3fc3c51711"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(7280, 196)\n"
     ]
    }
   ],
   "source": [
    "test_loader_NotMNIST = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000, shuffle=True)\n",
    "\n",
    "for batch in test_loader_NotMNIST:\n",
    "\n",
    "    img = batch\n",
    "    #img = img.reshape(-1,1,28,28)\n",
    "\n",
    "    # Generating output\n",
    "    ##out = model.forward(img)\n",
    "\n",
    "    out = model.forward(img)\n",
    "    img.requires_grad = True\n",
    "    loss = criterion(out, img)\n",
    "    model.zero_grad()\n",
    "    loss.backward()\n",
    "    gradient = img.grad.data.sign()\n",
    "    img = img + 0.1 * gradient\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "    ##latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "latent_test_out_NotMNIST = latent_test_out.detach().numpy()\n",
    "latent_test_out_NotMNIST = latent_test_out_NotMNIST.reshape(-1,4*7*7)\n",
    "print(latent_test_out_NotMNIST.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 982,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4695,
     "status": "ok",
     "timestamp": 1694123350754,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "34usMYYqdh8u",
    "outputId": "c2884d05-005a-4cc6-b7e7-94a972af58bc"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(7280, 500)\n",
      "[[450  44 130 ...  19 201  28]\n",
      " [  5  44 167 ... 175 116  10]\n",
      " [  5  46 279 ...  19 201  25]\n",
      " ...\n",
      " [  5  47 279 ...  11 422 397]\n",
      " [358 400 164 ... 196 121 298]\n",
      " [358  44 317 ...  19  63  25]]\n",
      "0.8209897715430862\n",
      "0.0016744257599869408\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_NotMNIST = et.apply(latent_test_out_NotMNIST)\n",
    "\n",
    "print(leaves_test_out_NotMNIST.shape)\n",
    "print(leaves_test_out_NotMNIST)\n",
    "\n",
    "distances_test_out_NotMNIST = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_NotMNIST[i,j] = hamming(leaves_test_out_NotMNIST[i,:], leaves_test_out_NotMNIST[j,:])\n",
    "\n",
    "score_test_out_NotMNIST = sum(distances_test_out_NotMNIST)/499\n",
    "\n",
    "print(np.mean(score_test_out_NotMNIST))\n",
    "print(np.cov(score_test_out_NotMNIST))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 982,
   "metadata": {
    "executionInfo": {
     "elapsed": 24,
     "status": "ok",
     "timestamp": 1694123350754,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "SniWCeDXdh99"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "tamsyBx9xv2t"
   },
   "source": [
    "## Gaussian"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 983,
   "metadata": {
    "executionInfo": {
     "elapsed": 24,
     "status": "ok",
     "timestamp": 1694123350755,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "efiYSL3HjJa5"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 984,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 1132,
     "status": "ok",
     "timestamp": 1694123351864,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "qAcmKgItEge1",
    "outputId": "86ebe8e3-b8e9-4d3e-e394-e9474731c173"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 784)\n",
      "(10000, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "# Gaussian random noise\n",
    "mean_test_out = np.random.uniform(low=0,high=1,size=784)\n",
    "cov_test_out = np.random.rand(784,784)\n",
    "cov_test_out = np.matmul(cov_test_out, cov_test_out.T)\n",
    "X_test_out = np.random.multivariate_normal(mean_test_out, cov_test_out, 10000)\n",
    "X_test_out = MinMaxScaler().fit_transform(X_test_out)\n",
    "print(X_test_out.shape)\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 985,
   "metadata": {
    "executionInfo": {
     "elapsed": 2,
     "status": "ok",
     "timestamp": 1694123351864,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "i1d4sx8MitCF"
   },
   "outputs": [],
   "source": [
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# train_loader_Gaussian = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, train_loader_Gaussian, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 986,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 897,
     "status": "ok",
     "timestamp": 1694123352759,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "QxSu2wMBxyYr",
    "outputId": "f280ea87-f02e-4805-a7e7-90fa901269d3"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 4, 7, 7)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000)\n",
    "\n",
    "for batch in test_loader:\n",
    "    img = batch\n",
    "    img = img.reshape(-1,1,28,28)\n",
    "    # Generating output\n",
    "    #out = model.forward(img)\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Gaussian = latent_test_out.detach().numpy()\n",
    "print(latent_test_out_Gaussian.shape)\n",
    "latent_test_out_Gaussian = latent_test_out_Gaussian.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Gaussian.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 987,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 3732,
     "status": "ok",
     "timestamp": 1694123356488,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "l24-4OTyxyaj",
    "outputId": "eee37a96-6b67-4260-a353-8880d7598708"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[  6 253 177 ... 193 139 290]\n",
      " [  6 253 177 ... 189 127 290]\n",
      " [  6 253 177 ... 189 127 290]\n",
      " ...\n",
      " [  6 253 177 ... 189 121 290]\n",
      " [  6 253 177 ... 193 139 290]\n",
      " [  6 253 177 ... 215 139 290]]\n",
      "0.28608115430861725\n",
      "0.003714976443165419\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Gaussian = et.apply(latent_test_out_Gaussian)\n",
    "\n",
    "print(leaves_test_out_Gaussian.shape)\n",
    "print(leaves_test_out_Gaussian)\n",
    "\n",
    "distances_test_out_Gaussian = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Gaussian[i,j] = hamming(leaves_test_out_Gaussian[i,:], leaves_test_out_Gaussian[j,:])\n",
    "\n",
    "score_test_out_Gaussian = sum(distances_test_out_Gaussian)/499\n",
    "\n",
    "print(np.mean(score_test_out_Gaussian))\n",
    "print(np.cov(score_test_out_Gaussian))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "4Zs0-6kFybMM"
   },
   "source": [
    "## Uniform"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 988,
   "metadata": {
    "executionInfo": {
     "elapsed": 22,
     "status": "ok",
     "timestamp": 1694123356490,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BHdD_LxEjNmI"
   },
   "outputs": [],
   "source": [
    "# model_Conv_AE_OOD_MNIST_train_30 = 'classifier.pt'\n",
    "# path = \"/content/gdrive/My Drive/{model_Conv_AE_OOD_MNIST_train_30}\"\n",
    "# model.load_state_dict(torch.load(path))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 989,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 20,
     "status": "ok",
     "timestamp": 1694123356490,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "6b5z_lW8xycj",
    "outputId": "caf1016a-4e8d-4b5c-a76b-05dec538da9e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 784)\n",
      "(10000, 1, 28, 28)\n"
     ]
    }
   ],
   "source": [
    "# Uniform random noise\n",
    "x_min = [0]*784\n",
    "x_max = [1]*784\n",
    "X_test_out = np.random.uniform(low=x_min, high=x_max, size=(10000,784))\n",
    "X_test_out = MinMaxScaler().fit_transform(X_test_out)\n",
    "print(X_test_out.shape)\n",
    "X_test_out = X_test_out.reshape((-1,1,28,28))\n",
    "print(X_test_out.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 990,
   "metadata": {
    "executionInfo": {
     "elapsed": 450,
     "status": "ok",
     "timestamp": 1694123356923,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "X6MhxpC2jQU2"
   },
   "outputs": [],
   "source": [
    "# X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "# train_loader_Uniform = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=64, shuffle=True)\n",
    "\n",
    "# # model = ConvAutoencoder()\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# train(model, train_loader_Uniform, criterion, optimizer, num_epochs=num_epoch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 991,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 976,
     "status": "ok",
     "timestamp": 1694123357897,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BG0fLErIxyeZ",
    "outputId": "779d28cb-418b-4bae-afa2-2f4076f8f163"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 4, 7, 7)\n",
      "(10000, 196)\n"
     ]
    }
   ],
   "source": [
    "X_test_out_tensor = torch.tensor(X_test_out, dtype=torch.float32)\n",
    "test_loader = torch.utils.data.DataLoader(X_test_out_tensor, batch_size=10000)\n",
    "\n",
    "for batch in test_loader:\n",
    "    img = batch\n",
    "    img = img.reshape(-1,1,28,28)\n",
    "    # Generating output\n",
    "    #out = model.forward(img)\n",
    "    latent_test_out = model.forward_encoder(img)\n",
    "\n",
    "\n",
    "latent_test_out_Uniform = latent_test_out.detach().numpy()\n",
    "print(latent_test_out_Uniform.shape)\n",
    "latent_test_out_Uniform = latent_test_out_Uniform.reshape(-1,4*7*7)\n",
    "print(latent_test_out_Uniform.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 992,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 4113,
     "status": "ok",
     "timestamp": 1694123362007,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "FvwHsDP5yif8",
    "outputId": "4f1794e0-8e6c-4bf8-8f34-06dcfb7efdfe"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10000, 500)\n",
      "[[  6 253 172 ... 189 139 290]\n",
      " [  6 253 177 ... 193 139 290]\n",
      " [  6 253 172 ... 189 139 290]\n",
      " ...\n",
      " [  6 253 172 ... 215 151 290]\n",
      " [  6 253 172 ... 193 195 290]\n",
      " [  6 336 172 ... 189 127 290]]\n",
      "0.35705949498998013\n",
      "0.000598866421107132\n"
     ]
    }
   ],
   "source": [
    "leaves_test_out_Uniform = et.apply(latent_test_out_Uniform)\n",
    "\n",
    "print(leaves_test_out_Uniform.shape)\n",
    "print(leaves_test_out_Uniform)\n",
    "\n",
    "distances_test_out_Uniform = np.zeros((500,500))\n",
    "\n",
    "for i in range(500):\n",
    "    for j in range(500):\n",
    "        distances_test_out_Uniform[i,j] = hamming(leaves_test_out_Uniform[i,:], leaves_test_out_Uniform[j,:])\n",
    "\n",
    "score_test_out_Uniform = sum(distances_test_out_Uniform)/499\n",
    "\n",
    "print(np.mean(score_test_out_Uniform))\n",
    "print(np.cov(score_test_out_Uniform))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 992,
   "metadata": {
    "executionInfo": {
     "elapsed": 18,
     "status": "ok",
     "timestamp": 1694123362007,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "N_CKgEZ1yiju"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 992,
   "metadata": {
    "executionInfo": {
     "elapsed": 17,
     "status": "ok",
     "timestamp": 1694123362007,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "nxm_k1Noyil7"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "FZGej4gIyhMD"
   },
   "source": [
    "# Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 994,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 12,
     "status": "ok",
     "timestamp": 1694123362431,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "xMKKU1PywASB",
    "outputId": "7f443249-d8c3-4769-f996-213b8435970e"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1.0\n",
      "0.997516\n",
      "0.99312\n",
      "1.0\n",
      "0.8372759999999999\n",
      "0.904878\n",
      "0.8894240000000001\n",
      "1.0\n",
      "0.999868\n",
      "0.99434\n",
      "1.0\n",
      "1.0\n",
      "0.994568\n",
      "1.0\n",
      "1.0\n",
      "1.0\n"
     ]
    }
   ],
   "source": [
    "score_pred_Breast = np.concatenate([score_test_in, score_test_out_Breast])\n",
    "score_pred_Chest = np.concatenate([score_test_in, score_test_out_Chest])\n",
    "score_pred_Oct = np.concatenate([score_test_in, score_test_out_Oct])\n",
    "score_pred_Organa = np.concatenate([score_test_in, score_test_out_Organa])\n",
    "score_pred_Organc = np.concatenate([score_test_in, score_test_out_Organc])\n",
    "score_pred_Organs = np.concatenate([score_test_in, score_test_out_Organs])\n",
    "score_pred_Pneum = np.concatenate([score_test_in, score_test_out_Pneum])\n",
    "score_pred_Tissue = np.concatenate([score_test_in, score_test_out_Tissue])\n",
    "score_pred_KMNIST = np.concatenate([score_test_in, score_test_out_KMNIST])\n",
    "score_pred_QMNIST = np.concatenate([score_test_in, score_test_out_QMNIST])\n",
    "score_pred_Omniglot = np.concatenate([score_test_in, score_test_out_Omniglot])\n",
    "score_pred_Cifar10bw = np.concatenate([score_test_in, score_test_out_Cifar10bw])\n",
    "score_pred_NotMNIST = np.concatenate([score_test_in, score_test_out_NotMNIST])\n",
    "score_pred_Gaussian = np.concatenate([score_test_in, score_test_out_Gaussian])\n",
    "score_pred_Uniform = np.concatenate([score_test_in, score_test_out_Uniform])\n",
    "score_true = np.concatenate([np.ones(500), np.zeros(500)])\n",
    "\n",
    "print(roc_auc_score(score_true, score_pred_Fashion))\n",
    "print(roc_auc_score(score_true, score_pred_Breast))\n",
    "print(roc_auc_score(score_true, score_pred_Chest))\n",
    "print(roc_auc_score(score_true, score_pred_Oct))\n",
    "print(roc_auc_score(score_true, score_pred_Organa))\n",
    "print(roc_auc_score(score_true, score_pred_Organc))\n",
    "print(roc_auc_score(score_true, score_pred_Organs))\n",
    "print(roc_auc_score(score_true, score_pred_Pneum))\n",
    "print(roc_auc_score(score_true, score_pred_Tissue))\n",
    "print(roc_auc_score(score_true, score_pred_KMNIST))\n",
    "print(roc_auc_score(score_true, score_pred_QMNIST))\n",
    "print(roc_auc_score(score_true, score_pred_Omniglot))\n",
    "print(roc_auc_score(score_true, score_pred_Cifar10bw))\n",
    "print(roc_auc_score(score_true, score_pred_NotMNIST))\n",
    "print(roc_auc_score(score_true, score_pred_Gaussian))\n",
    "print(roc_auc_score(score_true, score_pred_Uniform))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 995,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 11,
     "status": "ok",
     "timestamp": 1694123362432,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "77iJeZtfwYyj",
    "outputId": "241ea30d-4a8a-42c0-f554-872254f422be"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1.0\n",
      "0.9970073287925589\n",
      "0.9791152869534225\n",
      "1.0\n",
      "0.7727615803676721\n",
      "0.8314291529910411\n",
      "0.8245685390174654\n",
      "1.0\n",
      "0.999863724292722\n",
      "0.9937025007114986\n",
      "1.0\n",
      "1.0\n",
      "0.9936579215039639\n",
      "1.0\n",
      "1.0\n",
      "1.0\n"
     ]
    }
   ],
   "source": [
    "precision_Breast, recall_Breast, thresholds_Breast = precision_recall_curve(score_true, score_pred_Breast)\n",
    "precision_Chest, recall_Chest, thresholds_Chest = precision_recall_curve(score_true, score_pred_Chest)\n",
    "precision_Oct, recall_Oct, thresholds_Oct = precision_recall_curve(score_true, score_pred_Oct)\n",
    "precision_Organa, recall_Organa, thresholds_Organa = precision_recall_curve(score_true, score_pred_Organa)\n",
    "precision_Organc, recall_Organc, thresholds_Organc = precision_recall_curve(score_true, score_pred_Organc)\n",
    "precision_Organs, recall_Organs, thresholds_Organs = precision_recall_curve(score_true, score_pred_Organs)\n",
    "precision_Pneum, recall_Pneum, thresholds_Pneum = precision_recall_curve(score_true, score_pred_Pneum)\n",
    "precision_Tissue, recall_Tissue, thresholds_Tissue = precision_recall_curve(score_true, score_pred_Tissue)\n",
    "precision_KMNIST, recall_KMNIST, thresholds_KMNIST = precision_recall_curve(score_true, score_pred_KMNIST)\n",
    "precision_QMNIST, recall_QMNIST, thresholds_QMNIST = precision_recall_curve(score_true, score_pred_QMNIST)\n",
    "precision_Omniglot, recall_Omniglot, thresholds_Omniglot = precision_recall_curve(score_true, score_pred_Omniglot)\n",
    "precision_Cifar10bw, recall_Cifar10bw, threshold_Cifar10bw = precision_recall_curve(score_true, score_pred_Cifar10bw)\n",
    "precision_NotMNIST, recall_NotMNIST, thresholds_NotMNIST = precision_recall_curve(score_true, score_pred_NotMNIST)\n",
    "precision_Gaussian, recall_Gaussian, thresholds_Gaussian = precision_recall_curve(score_true, score_pred_Gaussian)\n",
    "precision_Uniform, recall_Uniform, thresholds_Uniform = precision_recall_curve(score_true, score_pred_Uniform)\n",
    "\n",
    "auc_precision_recall_Breast = auc(recall_Breast, precision_Breast)\n",
    "auc_precision_recall_Chest = auc(recall_Chest, precision_Chest)\n",
    "auc_precision_recall_Oct = auc(recall_Oct, precision_Oct)\n",
    "auc_precision_recall_Organa = auc(recall_Organa, precision_Organa)\n",
    "auc_precision_recall_Organc = auc(recall_Organc, precision_Organc)\n",
    "auc_precision_recall_Organs = auc(recall_Organs, precision_Organs)\n",
    "auc_precision_recall_Pneum = auc(recall_Pneum, precision_Pneum)\n",
    "auc_precision_recall_Tissue = auc(recall_Tissue, precision_Tissue)\n",
    "auc_precision_recall_KMNIST = auc(recall_KMNIST, precision_KMNIST)\n",
    "auc_precision_recall_QMNIST = auc(recall_QMNIST, precision_QMNIST)\n",
    "auc_precision_recall_Omniglot = auc(recall_Omniglot, precision_Omniglot)\n",
    "auc_precision_recall_Cifar10bw = auc(recall_Cifar10bw, precision_Cifar10bw)\n",
    "auc_precision_recall_NotMNIST = auc(recall_NotMNIST, precision_NotMNIST)\n",
    "auc_precision_recall_Gaussian = auc(recall_Gaussian, precision_Gaussian)\n",
    "auc_precision_recall_Uniform = auc(recall_Uniform, precision_Uniform)\n",
    "\n",
    "print(auc_precision_recall_Breast)\n",
    "print(auc_precision_recall_Chest)\n",
    "print(auc_precision_recall_Oct)\n",
    "print(auc_precision_recall_Organa)\n",
    "print(auc_precision_recall_Organc)\n",
    "print(auc_precision_recall_Organs)\n",
    "print(auc_precision_recall_Pneum)\n",
    "print(auc_precision_recall_Tissue)\n",
    "print(auc_precision_recall_KMNIST)\n",
    "print(auc_precision_recall_QMNIST)\n",
    "print(auc_precision_recall_Omniglot)\n",
    "print(auc_precision_recall_Cifar10bw)\n",
    "print(auc_precision_recall_NotMNIST)\n",
    "print(auc_precision_recall_Gaussian)\n",
    "print(auc_precision_recall_Uniform)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 996,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 804,
     "status": "ok",
     "timestamp": 1694123363228,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "IW5FtpbMWrGf",
    "outputId": "069a2bc2-1854-4921-b7be-75a7ec7b1b99"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.0\n",
      "0.008\n",
      "0.012\n",
      "0.0\n",
      "0.288\n",
      "0.18\n",
      "0.184\n",
      "0.0\n",
      "0.0\n",
      "0.026\n",
      "0.0\n",
      "0.0\n",
      "0.0\n",
      "0.02\n",
      "0.0\n",
      "0.0\n"
     ]
    }
   ],
   "source": [
    "def compute_fpr95(y_true, y_pred_probs):\n",
    "    fpr, tpr, thresholds = sklearn.metrics.roc_curve(y_true, y_pred_probs)\n",
    "    idx = np.abs(tpr - 0.95).argmin()\n",
    "    fpr95 = fpr[idx]\n",
    "    return fpr95\n",
    "\n",
    "# Example usage\n",
    "# Assuming you have y_true (true labels) and y_pred_probs (predicted probabilities)\n",
    "fpr95_score_Breast = compute_fpr95(score_true, score_pred_Breast)\n",
    "fpr95_score_Chest = compute_fpr95(score_true, score_pred_Chest)\n",
    "fpr95_score_Oct = compute_fpr95(score_true, score_pred_Oct)\n",
    "fpr95_score_Organa = compute_fpr95(score_true, score_pred_Organa)\n",
    "fpr95_score_Organc = compute_fpr95(score_true, score_pred_Organc)\n",
    "fpr95_score_Organs = compute_fpr95(score_true, score_pred_Organs)\n",
    "fpr95_score_Pneum = compute_fpr95(score_true, score_pred_Pneum)\n",
    "fpr95_score_Tissue = compute_fpr95(score_true, score_pred_Tissue)\n",
    "fpr95_score_KMNIST = compute_fpr95(score_true, score_pred_KMNIST)\n",
    "fpr95_score_QMNIST = compute_fpr95(score_true, score_pred_QMNIST)\n",
    "fpr95_score_Omniglot = compute_fpr95(score_true, score_pred_Omniglot)\n",
    "fpr95_score_NotMNIST = compute_fpr95(score_true, score_pred_NotMNIST)\n",
    "fpr95_score_Cifar10bw = compute_fpr95(score_true, score_pred_Cifar10bw)\n",
    "fpr95_score_Gaussian = compute_fpr95(score_true, score_pred_Gaussian)\n",
    "fpr95_score_Uniform = compute_fpr95(score_true, score_pred_Uniform)\n",
    "\n",
    "print(fpr95_score_Breast)\n",
    "print(fpr95_score_Chest)\n",
    "print(fpr95_score_Oct)\n",
    "print(fpr95_score_Organa)\n",
    "print(fpr95_score_Organc)\n",
    "print(fpr95_score_Organs)\n",
    "print(fpr95_score_Pneum)\n",
    "print(fpr95_score_Tissue)\n",
    "print(fpr95_score_KMNIST)\n",
    "print(fpr95_score_QMNIST)\n",
    "print(fpr95_score_Omniglot)\n",
    "print(fpr95_score_NotMNIST)\n",
    "print(fpr95_score_Cifar10bw)\n",
    "print(fpr95_score_Uniform)\n",
    "print(fpr95_score_Gaussian)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 996,
   "metadata": {
    "executionInfo": {
     "elapsed": 803,
     "status": "ok",
     "timestamp": 1694123363228,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "gZKuFE86Ey0O"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 997,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 12,
     "status": "ok",
     "timestamp": 1694123363229,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "9Lltqc9pEy3V",
    "outputId": "5737a9db-42f5-40b4-cc4e-3b8b7a81280b"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.9676757194388776 0.015277791051508323\n",
      "0.7290740681362725 0.054224058728752134\n",
      "0.757487871743487 0.06318870892600097\n",
      "0.7052959839679358 0.0783057643530629\n",
      "0.7772529378757516 0.04238601116454942\n",
      "0.8572637274549102 0.08541532714920053\n",
      "0.8289275511022047 0.08963767968435297\n",
      "0.8284305571142286 0.08957000334025988\n",
      "0.511020889779559 0.06506654475211567\n",
      "0.8148208737474949 0.04174355299385855\n",
      "0.8934494589178358 0.028244143987911623\n",
      "0.7437405210420841 0.049393245367634696\n",
      "0.5652618677354709 0.06977802119626873\n",
      "0.752224496993988 0.0786803979434876\n",
      "0.8209897715430862 0.040919747799649756\n",
      "0.28608115430861725 0.06095060658570527\n",
      "0.35705949498998013 0.02447174740608304\n"
     ]
    }
   ],
   "source": [
    "print(np.mean(score_test_in), np.sqrt(np.cov(score_test_in)))\n",
    "print(np.mean(score_test_out_Breast), np.sqrt(np.cov(score_test_out_Breast)))\n",
    "print(np.mean(score_test_out_Chest), np.sqrt(np.cov(score_test_out_Chest)))\n",
    "print(np.mean(score_test_out_Oct), np.sqrt(np.cov(score_test_out_Oct)))\n",
    "print(np.mean(score_test_out_Organa), np.sqrt(np.cov(score_test_out_Organa)))\n",
    "print(np.mean(score_test_out_Organc), np.sqrt(np.cov(score_test_out_Organc)))\n",
    "print(np.mean(score_test_out_Organs), np.sqrt(np.cov(score_test_out_Organs)))\n",
    "print(np.mean(score_test_out_Pneum), np.sqrt(np.cov(score_test_out_Pneum)))\n",
    "print(np.mean(score_test_out_Tissue), np.sqrt(np.cov(score_test_out_Tissue)))\n",
    "print(np.mean(score_test_out_KMNIST), np.sqrt(np.cov(score_test_out_KMNIST)))\n",
    "print(np.mean(score_test_out_QMNIST), np.sqrt(np.cov(score_test_out_QMNIST)))\n",
    "print(np.mean(score_test_out_Omniglot), np.sqrt(np.cov(score_test_out_Omniglot)))\n",
    "print(np.mean(score_test_out_Cifar10bw), np.sqrt(np.cov(score_test_out_Cifar10bw)))\n",
    "print(np.mean(score_test_out_NotMNIST), np.sqrt(np.cov(score_test_out_NotMNIST)))\n",
    "print(np.mean(score_test_out_Gaussian), np.sqrt(np.cov(score_test_out_Gaussian)))\n",
    "print(np.mean(score_test_out_Uniform), np.sqrt(np.cov(score_test_out_Uniform)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 999,
   "metadata": {
    "executionInfo": {
     "elapsed": 10,
     "status": "ok",
     "timestamp": 1694123363229,
     "user": {
      "displayName": "Zhaiming Shen",
      "userId": "12760861740580065439"
     },
     "user_tz": 240
    },
    "id": "BQQOs20XAERs"
   },
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "qyjuDTOXQ4J3"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "authorship_tag": "ABX9TyPlhfuug6iB06z1HInJwb/Z",
   "machine_shape": "hm",
   "provenance": [
    {
     "file_id": "1el3O14CTxaG4HSenMnLS_BlexLv84Hth",
     "timestamp": 1694109556821
    },
    {
     "file_id": "1Fp5qny4ygd5s_dco0cnOGx4MohZmAEiT",
     "timestamp": 1690739976595
    }
   ]
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
