{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "a4aa2828-b07d-4c29-b024-02863383942b",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import os\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "from tqdm import tqdm\n",
    "import pandas as pd\n",
    "from IPython.display import HTML\n",
    "\n",
    "import torch\n",
    "import torchvision\n",
    "from torchvision.datasets import CIFAR100\n",
    "from torchvision import transforms\n",
    "import clip\n",
    "import calibration as cal\n",
    "from torch.nn import functional as F\n",
    "from torch import nn, optim\n",
    "\n",
    "from src.data import *\n",
    "from src.utils import *\n",
    "from src.models import *\n",
    "\n",
    "from dataclasses import dataclass"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "bee01b68-595c-483f-9ce8-a6d6ccf50a8f",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "def run_exp(args):\n",
    "    \n",
    "    seed_all(seed = args.seed)\n",
    "    \n",
    "    n_val_samples = args.n_val_samples\n",
    "    n_test_samples = args.n_test_samples\n",
    "    \n",
    "    args.is_wilds = is_wilds(args.dataset)\n",
    "    split = args.val_split\n",
    "\n",
    "    if not args.is_wilds:\n",
    "        if (args.dataset, args.model, split) in save_data:\n",
    "            val_dataset = load_dataset_from_store(args.dataset, args.model, split)\n",
    "        else:\n",
    "            raise ValueError\n",
    "    else:\n",
    "        if (args.dataset, args.model, split) in save_data:\n",
    "            val_dataset = load_wilds_dataset(args, split)\n",
    "        else:  \n",
    "            raise ValueError\n",
    "            \n",
    "    test_dataset = val_dataset.random_split(n_samples=n_val_samples)\n",
    "    val_data_loader = dataloader_from_dataset(val_dataset, args)\n",
    "    test_data_loader = dataloader_from_dataset(test_dataset, args)\n",
    "\n",
    "    test_dataset.random_sample(n_samples=n_test_samples)\n",
    "    args.input_feature_dim = val_dataset.features.shape[-1]\n",
    "    \n",
    "    if args.scaling == \"platt\":\n",
    "\n",
    "        mix_source_h = train_h(val_dataset)\n",
    "        mix_source_w = mix_source_h.clf.coef_[0][0]\n",
    "        mix_source_b = mix_source_h.clf.intercept_[0]\n",
    "        mix_source_w, mix_source_b\n",
    "\n",
    "    elif args.scaling == \"temp\":\n",
    "        \n",
    "        temp_scaler = ModelWithTemperature()\n",
    "        temp_scaler.set_temperature(val_dataset)\n",
    "        temp_scaler.eval()\n",
    "        mix_source_h = temp_scaler\n",
    "        mix_source_w = temp_scaler.temperature.item()\n",
    "        mix_source_b = None\n",
    "        \n",
    "    print(\"w, b:\", mix_source_w, mix_source_b)\n",
    "    print(\"\\nUncalibrated Validation\")\n",
    "    val_dataset.measure_calibration()\n",
    "    # print(\"Calibrate Validation Using Validation\")\n",
    "    # val_dataset.measure_calibration(h=mix_source_h, h_type=args.scaling)\n",
    "    # print(\"Val Accuracy\")\n",
    "    # val_dataset.measure_accuracy()\n",
    "    print(\"\\nUncalibrated OOD Test\")\n",
    "    test_uncal_scores = test_dataset.measure_calibration()\n",
    "    print(\"Calibrate Test Using Validation\")\n",
    "    test_cal_scores = test_dataset.measure_calibration(h=mix_source_h, h_type=args.scaling)\n",
    "    # print(\"OOD Test Accuracy\")\n",
    "    # test_dataset.measure_accuracy()\n",
    "    print()\n",
    "    \n",
    "    val_conf = np.max(val_dataset.probs, -1)\n",
    "    val_y_hat = np.argmax(val_dataset.probs, -1)\n",
    "    val_y_correct = np.array((val_y_hat==val_dataset.labels), dtype=int)\n",
    "    \n",
    "    print(\"Histogram Binning\")\n",
    "    h = cal.HistogramTopCalibrator(val_dataset.probs.shape[0], num_bins=15)\n",
    "    h.train_calibration(val_dataset.probs, val_dataset.labels)\n",
    "    hist_bin_scores = test_dataset.measure_calibration(h=h, h_type=\"platt\")\n",
    "    \n",
    "    print(\"Platt Binning\")\n",
    "    h = cal.PlattBinnerTopCalibrator(val_dataset.probs.shape[0], num_bins=15)\n",
    "    h.train_calibration(val_dataset.probs, val_dataset.labels)\n",
    "    platt_bin_scores = test_dataset.measure_calibration(h=h, h_type=\"platt\")\n",
    "    \n",
    "    res = [\n",
    "        (\"Histogram Binner\", hist_bin_scores[\"ECE-1\"], hist_bin_scores[\"ECE-2\"]),\n",
    "        (\"Platt Binner\", platt_bin_scores[\"ECE-1\"], platt_bin_scores[\"ECE-2\"]),\n",
    "        (args.scaling.capitalize()+\" Scaling\", test_cal_scores[\"ECE-1\"], test_cal_scores[\"ECE-2\"]),\n",
    "    ]\n",
    "    \n",
    "    if args.scaling == \"temp\":\n",
    "        print(\"Platt Scaling\")\n",
    "        h = cal.PlattTopCalibrator(val_dataset.probs.shape[0], num_bins=15)\n",
    "        h.train_calibration(val_dataset.probs, val_dataset.labels)\n",
    "        platt_scores = test_dataset.measure_calibration(h=h, h_type=\"platt\")\n",
    "        res.append((\"Platt Scaling\", platt_scores[\"ECE-1\"], platt_scores[\"ECE-2\"]))\n",
    "        \n",
    "    res.append((\"Uncalibrated\", test_uncal_scores[\"ECE-1\"], test_uncal_scores[\"ECE-2\"]),)\n",
    "    \n",
    "    return res\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "dfec1bb5-32b0-402e-abb3-da3d09594c88",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "@dataclass\n",
    "class Args:\n",
    "    model: str\n",
    "    dataset: str\n",
    "    val_split: str\n",
    "    sel_losses: list\n",
    "    # test_split: str\n",
    "    cov_loss: str=\"quad\"\n",
    "    scaling: str=\"platt\"\n",
    "    n_epoch: int=2\n",
    "    coverage_weight: float=0.01\n",
    "    beta: float=0.8\n",
    "    lr: float=0.001\n",
    "    grad_clip: int=10\n",
    "    batch_size: int=256\n",
    "    input_feature_dim: int=None\n",
    "    low_quantile: int=80\n",
    "    high_quantile: int=100\n",
    "    n_val_samples: int=5000\n",
    "    n_test_samples: int=250000\n",
    "    save_results: bool=False\n",
    "    quiet: bool=False\n",
    "    baselines: str=\"all\"\n",
    "    seed: int=1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "daf615d0-3889-4eb6-b298-730315417e57",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "0f700715-3fee-4e5b-9787-c83bdeee7266",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Args(model='resnet', dataset='imagenet', val_split='test', sel_losses=['bce', 'smmce', 'mce'], cov_loss='quad', scaling='temp', n_epoch=2, coverage_weight=32, beta=0.8, lr=1e-05, grad_clip=10, batch_size=256, input_feature_dim=None, low_quantile=80, high_quantile=100, n_val_samples=2000, n_test_samples=250000, save_results=True, quiet=False, baselines='all', seed=1)\n",
      "(50000, 1000) (50000, 512) (50000,)\n",
      "(2000, 1000) (2000, 512) (2000,)\n",
      "(48000, 1000) (48000, 512) (48000,)\n",
      "(48000, 1000) (48000, 512) (48000,)\n",
      "Before temperature - NLL: 1.130, ECE: 0.046\n",
      "Optimal temperature: 1.131\n",
      "After temperature - NLL: 1.124, ECE: 0.040\n",
      "w, b: 1.130904197692871 None\n",
      "\n",
      "Uncalibrated Validation\n",
      "ECE-1 0.038720067778602284\n",
      "ECE-2 0.03849877043167031\n",
      "\n",
      "Uncalibrated OOD Test\n",
      "ECE-1 0.027692587445684078\n",
      "ECE-2 0.031974035618070384\n",
      "Calibrate Test Using Validation\n",
      "ECE-1 0.019061232810257935\n",
      "ECE-2 0.024962145922080285\n",
      "\n",
      "Histogram Binning\n",
      "ECE-1 0.02785677229454237\n",
      "ECE-2 0.03908354639500136\n",
      "Platt Binning\n",
      "ECE-1 0.022851398581583273\n",
      "ECE-2 0.029826486236563594\n",
      "Platt Scaling\n",
      "ECE-1 0.022705655082767583\n",
      "ECE-2 0.030287400737252848\n",
      "\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Method</th>\n",
       "      <th>ECE-1</th>\n",
       "      <th>ECE-2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Histogram Binner</td>\n",
       "      <td>0.027857</td>\n",
       "      <td>0.039084</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Platt Binner</td>\n",
       "      <td>0.022851</td>\n",
       "      <td>0.029826</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Temp Scaling</td>\n",
       "      <td>0.019061</td>\n",
       "      <td>0.024962</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Platt Scaling</td>\n",
       "      <td>0.022706</td>\n",
       "      <td>0.030287</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Uncalibrated</td>\n",
       "      <td>0.027693</td>\n",
       "      <td>0.031974</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             Method     ECE-1     ECE-2\n",
       "0  Histogram Binner  0.027857  0.039084\n",
       "1      Platt Binner  0.022851  0.029826\n",
       "2      Temp Scaling  0.019061  0.024962\n",
       "3     Platt Scaling  0.022706  0.030287\n",
       "4      Uncalibrated  0.027693  0.031974"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "##################################################\n",
    "##### ImageNet EXPERIMENT\n",
    "##################################################\n",
    "\n",
    "\n",
    "n_epoch = 2\n",
    "n_val_samples = 2000\n",
    "split = \"test\"\n",
    "lr = 0.00001\n",
    "batch_size=256\n",
    "baselines = \"all\"\n",
    "beta = 0.8\n",
    "low_quantile = int(beta*100)\n",
    "scaling = \"temp\"\n",
    "\n",
    "args = Args(\n",
    "    model = \"resnet\",\n",
    "    dataset = \"imagenet\", \n",
    "    val_split = split,\n",
    "    batch_size = batch_size,\n",
    "    n_epoch = n_epoch,\n",
    "    coverage_weight = 32,\n",
    "    n_val_samples = n_val_samples,\n",
    "    beta=beta,\n",
    "    low_quantile=low_quantile,\n",
    "    baselines = baselines,\n",
    "    scaling=scaling,\n",
    "    sel_losses=[\n",
    "        \"bce\", \n",
    "        \"smmce\",\n",
    "        \"mce\"\n",
    "    ],\n",
    "    lr=lr,\n",
    "    save_results=True,\n",
    ")\n",
    "\n",
    "print(args)\n",
    "res = run_exp(args)\n",
    "print()\n",
    "\n",
    "in_res_df = pd.DataFrame(res, columns=[\"Method\", \"ECE-1\", \"ECE-2\"])\n",
    "in_res_df.to_csv(\"../results/imagenet/id_recalibration_results.csv\", index=False)\n",
    "in_res_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "1c885e6e-4004-42a9-a18a-e24d1ea58b11",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Histogram Binner ECE-1</th>\n",
       "      <th>Histogram Binner ECE-2</th>\n",
       "      <th>Platt Binner ECE-1</th>\n",
       "      <th>Platt Binner ECE-2</th>\n",
       "      <th>Temp Scaling ECE-1</th>\n",
       "      <th>Temp Scaling ECE-2</th>\n",
       "      <th>Platt Scaling ECE-1</th>\n",
       "      <th>Platt Scaling ECE-2</th>\n",
       "      <th>Uncalibrated ECE-1</th>\n",
       "      <th>Uncalibrated ECE-2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.027857</td>\n",
       "      <td>0.039084</td>\n",
       "      <td>0.022851</td>\n",
       "      <td>0.029826</td>\n",
       "      <td>0.019061</td>\n",
       "      <td>0.024962</td>\n",
       "      <td>0.022706</td>\n",
       "      <td>0.030287</td>\n",
       "      <td>0.027693</td>\n",
       "      <td>0.031974</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Histogram Binner ECE-1  Histogram Binner ECE-2  Platt Binner ECE-1  \\\n",
       "0                0.027857                0.039084            0.022851   \n",
       "\n",
       "   Platt Binner ECE-2  Temp Scaling ECE-1  Temp Scaling ECE-2  \\\n",
       "0            0.029826            0.019061            0.024962   \n",
       "\n",
       "   Platt Scaling ECE-1  Platt Scaling ECE-2  Uncalibrated ECE-1  \\\n",
       "0             0.022706             0.030287            0.027693   \n",
       "\n",
       "   Uncalibrated ECE-2  \n",
       "0            0.031974  "
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_rows = []\n",
    "new_cols = []\n",
    "for mtd in in_res_df[\"Method\"].tolist():\n",
    "    row = in_res_df[in_res_df[\"Method\"]==mtd]\n",
    "    new_rows.extend([row[\"ECE-1\"].tolist()[0], row[\"ECE-2\"].tolist()[0]])\n",
    "    new_cols.extend([mtd+\" ECE-1\", mtd+\" ECE-2\"])\n",
    "    \n",
    "in_hor_df = pd.DataFrame([new_rows], columns=new_cols)\n",
    "in_hor_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "d300315d-99ef-4cc6-930a-677ae147e942",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{rrrrrrrrrr}\n",
      "\\toprule\n",
      " Histogram Binner ECE-1 &  Histogram Binner ECE-2 &  Platt Binner ECE-1 &  Platt Binner ECE-2 &  Temp Scaling ECE-1 &  Temp Scaling ECE-2 &  Platt Scaling ECE-1 &  Platt Scaling ECE-2 &  Uncalibrated ECE-1 &  Uncalibrated ECE-2 \\\\\n",
      "\\midrule\n",
      "                  0.028 &                   0.039 &               0.023 &               0.030 &               0.019 &               0.025 &                0.023 &                0.030 &               0.028 &               0.032 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_2543/1957001158.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(in_hor_df.to_latex(float_format=\"%.3f\", index=False))\n"
     ]
    }
   ],
   "source": [
    "print(in_hor_df.to_latex(float_format=\"%.3f\", index=False))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4e65e0ea-8981-4966-bcaa-8113024e43de",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "ba74c82a-b403-491b-b16d-7dd593c7814e",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Args(model='densenet', dataset='camelyon17', val_split='test', sel_losses=['bce', 'smmce'], cov_loss='quad', scaling='temp', n_epoch=1000, coverage_weight=32, beta=0.8, lr=0.0005, grad_clip=10, batch_size=100, input_feature_dim=None, low_quantile=80, high_quantile=100, n_val_samples=1000, n_test_samples=250000, save_results=True, quiet=False, baselines='all', seed=1)\n",
      "(85054, 2) (85054, 1024) (85054,)\n",
      "(1000, 2) (1000, 1024) (1000,)\n",
      "(84054, 2) (84054, 1024) (84054,)\n",
      "(84054, 2) (84054, 1024) (84054,)\n",
      "Before temperature - NLL: 0.473, ECE: 0.109\n",
      "Optimal temperature: 1.980\n",
      "After temperature - NLL: 0.365, ECE: 0.044\n",
      "w, b: 1.9800565242767334 None\n",
      "\n",
      "Uncalibrated Validation\n",
      "ECE-1 0.10906148004531863\n",
      "ECE-2 0.14098452058670902\n",
      "\n",
      "Uncalibrated OOD Test\n",
      "ECE-1 0.10189241453256052\n",
      "ECE-2 0.1420020761806125\n",
      "Calibrate Test Using Validation\n",
      "ECE-1 0.04865575862974108\n",
      "ECE-2 0.06601644496269551\n",
      "\n",
      "Histogram Binning\n",
      "ECE-1 0.025033354158394312\n",
      "ECE-2 0.03540246770169824\n",
      "Platt Binning\n",
      "ECE-1 0.03225142748020865\n",
      "ECE-2 0.03996171233134643\n",
      "Platt Scaling\n",
      "ECE-1 0.03325848489064143\n",
      "ECE-2 0.044065483966656153\n",
      "\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Method</th>\n",
       "      <th>ECE-1</th>\n",
       "      <th>ECE-2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Histogram Binner</td>\n",
       "      <td>0.025033</td>\n",
       "      <td>0.035402</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Platt Binner</td>\n",
       "      <td>0.032251</td>\n",
       "      <td>0.039962</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Temp Scaling</td>\n",
       "      <td>0.048656</td>\n",
       "      <td>0.066016</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Platt Scaling</td>\n",
       "      <td>0.033258</td>\n",
       "      <td>0.044065</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Uncalibrated</td>\n",
       "      <td>0.101892</td>\n",
       "      <td>0.142002</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             Method     ECE-1     ECE-2\n",
       "0  Histogram Binner  0.025033  0.035402\n",
       "1      Platt Binner  0.032251  0.039962\n",
       "2      Temp Scaling  0.048656  0.066016\n",
       "3     Platt Scaling  0.033258  0.044065\n",
       "4      Uncalibrated  0.101892  0.142002"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# ##################################################\n",
    "# ##### Camelyon17 EXPERIMENT\n",
    "# ##################################################\n",
    "\n",
    "\n",
    "split = \"test\"\n",
    "lr = 0.0005\n",
    "batch_size=100\n",
    "low_quantile = int(beta*100)\n",
    "\n",
    "args = Args(\n",
    "    model = \"densenet\",\n",
    "    dataset = \"camelyon17\", \n",
    "    val_split = split,\n",
    "    batch_size = batch_size,\n",
    "    n_epoch = 1000,\n",
    "    coverage_weight = 32,\n",
    "    n_val_samples = 1000,\n",
    "    beta=beta,\n",
    "    low_quantile=low_quantile,\n",
    "    baselines = \"all\",\n",
    "    sel_losses=[\n",
    "        \"bce\", \n",
    "        \"smmce\"\n",
    "    ],\n",
    "    lr=lr,\n",
    "    save_results=True,\n",
    "    scaling=\"temp\",\n",
    ")\n",
    "print(args)\n",
    "res = run_exp(args)\n",
    "print()\n",
    "\n",
    "cam_res_df = pd.DataFrame(res, columns=[\"Method\", \"ECE-1\", \"ECE-2\"])\n",
    "cam_res_df.to_csv(\"../results/camelyon17/id_recalibration_results.csv\", index=False)\n",
    "cam_res_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "addf0eac-7f20-42bd-ab21-d7510b41993c",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Histogram Binner ECE-1</th>\n",
       "      <th>Histogram Binner ECE-2</th>\n",
       "      <th>Platt Binner ECE-1</th>\n",
       "      <th>Platt Binner ECE-2</th>\n",
       "      <th>Temp Scaling ECE-1</th>\n",
       "      <th>Temp Scaling ECE-2</th>\n",
       "      <th>Platt Scaling ECE-1</th>\n",
       "      <th>Platt Scaling ECE-2</th>\n",
       "      <th>Uncalibrated ECE-1</th>\n",
       "      <th>Uncalibrated ECE-2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.025033</td>\n",
       "      <td>0.035402</td>\n",
       "      <td>0.032251</td>\n",
       "      <td>0.039962</td>\n",
       "      <td>0.048656</td>\n",
       "      <td>0.066016</td>\n",
       "      <td>0.033258</td>\n",
       "      <td>0.044065</td>\n",
       "      <td>0.101892</td>\n",
       "      <td>0.142002</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Histogram Binner ECE-1  Histogram Binner ECE-2  Platt Binner ECE-1  \\\n",
       "0                0.025033                0.035402            0.032251   \n",
       "\n",
       "   Platt Binner ECE-2  Temp Scaling ECE-1  Temp Scaling ECE-2  \\\n",
       "0            0.039962            0.048656            0.066016   \n",
       "\n",
       "   Platt Scaling ECE-1  Platt Scaling ECE-2  Uncalibrated ECE-1  \\\n",
       "0             0.033258             0.044065            0.101892   \n",
       "\n",
       "   Uncalibrated ECE-2  \n",
       "0            0.142002  "
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_rows = []\n",
    "new_cols = []\n",
    "for mtd in cam_res_df[\"Method\"].tolist():\n",
    "    row = cam_res_df[cam_res_df[\"Method\"]==mtd]\n",
    "    new_rows.extend([row[\"ECE-1\"].tolist()[0], row[\"ECE-2\"].tolist()[0]])\n",
    "    new_cols.extend([mtd+\" ECE-1\", mtd+\" ECE-2\"])\n",
    "    \n",
    "cam_hor_df = pd.DataFrame([new_rows], columns=new_cols)\n",
    "cam_hor_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "53f5d72c-e65a-42f8-8a43-ebbcc4bc62cf",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{rrrrrrrrrr}\n",
      "\\toprule\n",
      " Histogram Binner ECE-1 &  Histogram Binner ECE-2 &  Platt Binner ECE-1 &  Platt Binner ECE-2 &  Temp Scaling ECE-1 &  Temp Scaling ECE-2 &  Platt Scaling ECE-1 &  Platt Scaling ECE-2 &  Uncalibrated ECE-1 &  Uncalibrated ECE-2 \\\\\n",
      "\\midrule\n",
      "                  0.025 &                   0.035 &               0.032 &               0.040 &               0.049 &               0.066 &                0.033 &                0.044 &               0.102 &               0.142 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_2543/4154759489.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(cam_hor_df.to_latex(float_format=\"%.3f\", index=False))\n"
     ]
    }
   ],
   "source": [
    "print(cam_hor_df.to_latex(float_format=\"%.3f\", index=False))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "eae35f61-981c-455b-95c9-ca15969551a8",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "4b48fbe6-1381-4dbe-8158-19a55222cae7",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "mtds = in_res_df[\"Method\"].tolist()+cam_res_df[\"Method\"].tolist()\n",
    "mtds = list(set(mtds))\n",
    "\n",
    "rows = []\n",
    "for mtd in mtds:\n",
    "    in_row = in_res_df[in_res_df[\"Method\"] == mtd]\n",
    "    cam_row = cam_res_df[cam_res_df[\"Method\"] == mtd]\n",
    "\n",
    "    row = [mtd]\n",
    "    if len(in_row) > 0:\n",
    "        row.extend([in_row[\"ECE-1\"].tolist()[0], in_row[\"ECE-2\"].tolist()[0]])\n",
    "    else:\n",
    "        row.extend([None, None])\n",
    "    if len(cam_row) > 0:\n",
    "        row.extend([cam_row[\"ECE-1\"].tolist()[0], cam_row[\"ECE-2\"].tolist()[0]])\n",
    "    else:\n",
    "        row.extend([None, None])\n",
    "\n",
    "    rows.append(row)\n",
    "    \n",
    "final_df = pd.DataFrame(rows, columns=[\"Method\", \"ECE-1 (in)\", \"ECE-2 (in)\", \"ECE-1 (cam)\", \"ECE-2 (cam)\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "1522d40c-bf12-4830-8254-beccd6ed4482",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Method</th>\n",
       "      <th>ECE-1 (in)</th>\n",
       "      <th>ECE-2 (in)</th>\n",
       "      <th>ECE-1 (cam)</th>\n",
       "      <th>ECE-2 (cam)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Platt Binner</td>\n",
       "      <td>0.022851</td>\n",
       "      <td>0.029826</td>\n",
       "      <td>0.032251</td>\n",
       "      <td>0.039962</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Histogram Binner</td>\n",
       "      <td>0.027857</td>\n",
       "      <td>0.039084</td>\n",
       "      <td>0.025033</td>\n",
       "      <td>0.035402</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Temp Scaling</td>\n",
       "      <td>0.019061</td>\n",
       "      <td>0.024962</td>\n",
       "      <td>0.048656</td>\n",
       "      <td>0.066016</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Full</td>\n",
       "      <td>0.027693</td>\n",
       "      <td>0.031974</td>\n",
       "      <td>0.101892</td>\n",
       "      <td>0.142002</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Platt Scaling</td>\n",
       "      <td>0.022706</td>\n",
       "      <td>0.030287</td>\n",
       "      <td>0.033258</td>\n",
       "      <td>0.044065</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             Method  ECE-1 (in)  ECE-2 (in)  ECE-1 (cam)  ECE-2 (cam)\n",
       "0      Platt Binner    0.022851    0.029826     0.032251     0.039962\n",
       "1  Histogram Binner    0.027857    0.039084     0.025033     0.035402\n",
       "2      Temp Scaling    0.019061    0.024962     0.048656     0.066016\n",
       "3              Full    0.027693    0.031974     0.101892     0.142002\n",
       "4     Platt Scaling    0.022706    0.030287     0.033258     0.044065"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "final_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "d17dd099-5996-44dd-b6a4-784177b30904",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrr}\n",
      "\\toprule\n",
      "          Method &  ECE-1 (in) &  ECE-2 (in) &  ECE-1 (cam) &  ECE-2 (cam) \\\\\n",
      "\\midrule\n",
      "    Platt Binner &       0.023 &       0.030 &        0.032 &        0.040 \\\\\n",
      "Histogram Binner &       0.028 &       0.039 &        0.025 &        0.035 \\\\\n",
      "    Temp Scaling &       0.019 &       0.025 &        0.049 &        0.066 \\\\\n",
      "            Full &       0.028 &       0.032 &        0.102 &        0.142 \\\\\n",
      "   Platt Scaling &       0.023 &       0.030 &        0.033 &        0.044 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_3997/2434467966.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(final_df.to_latex(float_format=\"%.3f\", index=False))\n"
     ]
    }
   ],
   "source": [
    "print(final_df.to_latex(float_format=\"%.3f\", index=False))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "03d9d99c-e94a-4154-9442-1da7484108dc",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1b9e94c3-0e6b-4191-af4f-68059ef40eca",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bbd4d69d-bf16-4e8b-9461-a0c24f22f2fb",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cb129a5d-3e89-452c-8501-e9813b51be80",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
