{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "68f2f490-4df5-467c-8745-36a22a7790e9",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "stty: 'standard input': Inappropriate ioctl for device\n"
     ]
    }
   ],
   "source": [
    "from source.source.table_utils import (\n",
    "    collect_scores_into_dict_miss,\n",
    "    extract_same_different_dataframes,\n",
    "    aggregate_over_measures,\n",
    ")\n",
    "import pandas as pd\n",
    "from source.source.path_config import REPOSITORY_ROOT\n",
    "from source.losses.constants import LossName\n",
    "from source.metrics.constants import GName\n",
    "from source.datasets.constants import DatasetName\n",
    "from source.models.constants import ModelSource\n",
    "\n",
    "import numpy as np\n",
    "import os\n",
    "from IPython.display import display\n",
    "\n",
    "pd.set_option(\"display.max_rows\", None)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "b1198b55-1d45-4ad9-9432-2530e21b103d",
   "metadata": {},
   "outputs": [],
   "source": [
    "ind_dataset = DatasetName.CIFAR10_NOISY_LABEL.value\n",
    "model_source = ModelSource.OUR_MODELS.value\n",
    "\n",
    "full_mis_rocauc = pd.read_pickle(\n",
    "    f\"{REPOSITORY_ROOT}/tables/central_tables/final/{ind_dataset}_{model_source}_full_mis_rocauc.pkl\"\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "a1cd7550-8bc7-47be-a8c2-c9e784ec19bd",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>UQMetric</th>\n",
       "      <th>LossFunction</th>\n",
       "      <th>RocAucScores_array</th>\n",
       "      <th>architecture</th>\n",
       "      <th>training_dataset</th>\n",
       "      <th>base_rule</th>\n",
       "      <th>RiskType</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>LogScore TotalRisk inner central</td>\n",
       "      <td>CrossEntropy</td>\n",
       "      <td>[0.6912572280870063, 0.8144304905229434, 0.816...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>LogScore</td>\n",
       "      <td>inner central</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>190</th>\n",
       "      <td>SphericalScore TotalRisk outer outer</td>\n",
       "      <td>BrierScore</td>\n",
       "      <td>[0.8226008000593636, 0.7914094185461955, 0.752...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>SphericalScore</td>\n",
       "      <td>outer outer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>133</th>\n",
       "      <td>ZeroOneScore TotalRisk outer central</td>\n",
       "      <td>BrierScore</td>\n",
       "      <td>[0.8292069563340282, 0.8203730465301489, 0.740...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>ZeroOneScore</td>\n",
       "      <td>outer central</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>186</th>\n",
       "      <td>ZeroOneScore BayesRisk central</td>\n",
       "      <td>CrossEntropy</td>\n",
       "      <td>[0.7820142650723241, 0.837232767292478, 0.8115...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>ZeroOneScore</td>\n",
       "      <td>central</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>146</th>\n",
       "      <td>ZeroOneScore TotalRisk central outer</td>\n",
       "      <td>SphericalScore</td>\n",
       "      <td>[0.8507520993063161, 0.8363808616492008, 0.837...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>ZeroOneScore</td>\n",
       "      <td>central outer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>121</th>\n",
       "      <td>BrierScore BayesRisk inner</td>\n",
       "      <td>BrierScore</td>\n",
       "      <td>[0.8281574686823305, 0.7996790886607885, 0.756...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>BrierScore</td>\n",
       "      <td>inner</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>253</th>\n",
       "      <td>LogScore energy outer</td>\n",
       "      <td>BrierScore</td>\n",
       "      <td>[0.79704163546705, 0.7726924115938734, 0.73440...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>LogScore</td>\n",
       "      <td>energy outer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>173</th>\n",
       "      <td>ZeroOneScore ExcessRisk central outer</td>\n",
       "      <td>SphericalScore</td>\n",
       "      <td>[0.8733727796561741, 0.8271212460849693, 0.852...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>ZeroOneScore</td>\n",
       "      <td>central outer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>135</th>\n",
       "      <td>ZeroOneScore TotalRisk inner outer</td>\n",
       "      <td>CrossEntropy</td>\n",
       "      <td>[0.7967131983032528, 0.8441712524894938, 0.808...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>ZeroOneScore</td>\n",
       "      <td>inner outer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>120</th>\n",
       "      <td>BrierScore BayesRisk inner</td>\n",
       "      <td>CrossEntropy</td>\n",
       "      <td>[0.7371669151970955, 0.8334137516389305, 0.836...</td>\n",
       "      <td>resnet18</td>\n",
       "      <td>cifar10_noisy_label</td>\n",
       "      <td>BrierScore</td>\n",
       "      <td>inner</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                  UQMetric    LossFunction  \\\n",
       "15        LogScore TotalRisk inner central    CrossEntropy   \n",
       "190   SphericalScore TotalRisk outer outer      BrierScore   \n",
       "133   ZeroOneScore TotalRisk outer central      BrierScore   \n",
       "186         ZeroOneScore BayesRisk central    CrossEntropy   \n",
       "146   ZeroOneScore TotalRisk central outer  SphericalScore   \n",
       "121             BrierScore BayesRisk inner      BrierScore   \n",
       "253                  LogScore energy outer      BrierScore   \n",
       "173  ZeroOneScore ExcessRisk central outer  SphericalScore   \n",
       "135     ZeroOneScore TotalRisk inner outer    CrossEntropy   \n",
       "120             BrierScore BayesRisk inner    CrossEntropy   \n",
       "\n",
       "                                    RocAucScores_array architecture  \\\n",
       "15   [0.6912572280870063, 0.8144304905229434, 0.816...     resnet18   \n",
       "190  [0.8226008000593636, 0.7914094185461955, 0.752...     resnet18   \n",
       "133  [0.8292069563340282, 0.8203730465301489, 0.740...     resnet18   \n",
       "186  [0.7820142650723241, 0.837232767292478, 0.8115...     resnet18   \n",
       "146  [0.8507520993063161, 0.8363808616492008, 0.837...     resnet18   \n",
       "121  [0.8281574686823305, 0.7996790886607885, 0.756...     resnet18   \n",
       "253  [0.79704163546705, 0.7726924115938734, 0.73440...     resnet18   \n",
       "173  [0.8733727796561741, 0.8271212460849693, 0.852...     resnet18   \n",
       "135  [0.7967131983032528, 0.8441712524894938, 0.808...     resnet18   \n",
       "120  [0.7371669151970955, 0.8334137516389305, 0.836...     resnet18   \n",
       "\n",
       "        training_dataset       base_rule       RiskType  \n",
       "15   cifar10_noisy_label        LogScore  inner central  \n",
       "190  cifar10_noisy_label  SphericalScore    outer outer  \n",
       "133  cifar10_noisy_label    ZeroOneScore  outer central  \n",
       "186  cifar10_noisy_label    ZeroOneScore        central  \n",
       "146  cifar10_noisy_label    ZeroOneScore  central outer  \n",
       "121  cifar10_noisy_label      BrierScore          inner  \n",
       "253  cifar10_noisy_label        LogScore   energy outer  \n",
       "173  cifar10_noisy_label    ZeroOneScore  central outer  \n",
       "135  cifar10_noisy_label    ZeroOneScore    inner outer  \n",
       "120  cifar10_noisy_label      BrierScore          inner  "
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "full_mis_rocauc.sample(10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "2bcc7fc1-3728-42c4-8dca-ba26310aa564",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['cifar10_noisy_label'], dtype=object)"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "full_mis_rocauc.training_dataset.unique()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "a518565c-bdd2-4a6a-8fa2-ab630fab3f37",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.48775359511468824"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.hstack(full_mis_rocauc.RocAucScores_array.values).min()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4ac208c7-6da1-4642-b9d1-66547547e820",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "f0400b90-e628-4ff6-96a8-f90e70f3523d",
   "metadata": {},
   "outputs": [],
   "source": [
    "def selector(\n",
    "    df,\n",
    "    architecture,\n",
    "    UQMetric,\n",
    "):\n",
    "    arr = np.array(\n",
    "        df[\n",
    "            (df.UQMetric == UQMetric)\n",
    "            & (df.architecture == architecture)\n",
    "        ].RocAucScores_array.values[0]\n",
    "    )\n",
    "    # print(arr)\n",
    "\n",
    "    # return f\"Mean: {arr.mean()}, Std: {arr.std()}\"\n",
    "    return float(arr.mean()), float(arr.std())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "1c2bc9a8-c4a9-40a2-9cf6-1b39e0e4fe25",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_specific_stats(\n",
    "    architecture_,\n",
    "    loss_function_,\n",
    "    base_rule_,\n",
    "):\n",
    "    selected_results = full_mis_rocauc[\n",
    "        (full_mis_rocauc.base_rule == base_rule_)\n",
    "        & (full_mis_rocauc.LossFunction == loss_function_)\n",
    "    ]\n",
    "\n",
    "    full_res = {}\n",
    "    res_dict = {}\n",
    "    for uqmetric_name in [\n",
    "        el for el in full_mis_rocauc.UQMetric.unique() if el.startswith(base_rule_)\n",
    "    ]:\n",
    "        mean, std = selector(\n",
    "            df=selected_results,\n",
    "            UQMetric=uqmetric_name,\n",
    "            architecture=architecture_,\n",
    "        )\n",
    "        res_dict[uqmetric_name] = {\"mean\": mean, \"std\": std}\n",
    "    full_res = res_dict\n",
    "\n",
    "    return full_res"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5eea5252-06cb-49dc-831e-7e85472e5ee6",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0dc807fa-c9ab-44fd-bcce-9fda28ca848b",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "3094f898-d89b-4633-a45e-2dc8ebd30eb2",
   "metadata": {},
   "outputs": [],
   "source": [
    "# full_mis_rocauc['training_dataset'].unique()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8875e40a-a710-43fe-91b6-049ec14e9eec",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "a9062e8d-c5d5-45c6-909c-434e404a95ba",
   "metadata": {},
   "outputs": [],
   "source": [
    "architecture = \"resnet18\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "8c865844-5ee3-49e6-8fce-94c09cf01955",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer outer</th>\n",
       "      <td>0.757266</td>\n",
       "      <td>0.046807</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer inner</th>\n",
       "      <td>0.783553</td>\n",
       "      <td>0.047686</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer central</th>\n",
       "      <td>0.762649</td>\n",
       "      <td>0.050384</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner outer</th>\n",
       "      <td>0.757266</td>\n",
       "      <td>0.046807</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner inner</th>\n",
       "      <td>0.783553</td>\n",
       "      <td>0.047686</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner central</th>\n",
       "      <td>0.762649</td>\n",
       "      <td>0.050384</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central outer</th>\n",
       "      <td>0.793767</td>\n",
       "      <td>0.038486</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central inner</th>\n",
       "      <td>0.802061</td>\n",
       "      <td>0.039641</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central central</th>\n",
       "      <td>0.804374</td>\n",
       "      <td>0.036907</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer outer</th>\n",
       "      <td>0.683930</td>\n",
       "      <td>0.060733</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer inner</th>\n",
       "      <td>0.696427</td>\n",
       "      <td>0.061025</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer central</th>\n",
       "      <td>0.668474</td>\n",
       "      <td>0.059358</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner outer</th>\n",
       "      <td>0.676975</td>\n",
       "      <td>0.060858</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner inner</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner central</th>\n",
       "      <td>0.592383</td>\n",
       "      <td>0.061051</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central outer</th>\n",
       "      <td>0.699839</td>\n",
       "      <td>0.060773</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central inner</th>\n",
       "      <td>0.612817</td>\n",
       "      <td>0.065255</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central central</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk outer</th>\n",
       "      <td>0.782573</td>\n",
       "      <td>0.041099</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk inner</th>\n",
       "      <td>0.783553</td>\n",
       "      <td>0.047686</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk central</th>\n",
       "      <td>0.804374</td>\n",
       "      <td>0.036907</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore energy outer</th>\n",
       "      <td>0.746138</td>\n",
       "      <td>0.052281</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore energy inner</th>\n",
       "      <td>0.748162</td>\n",
       "      <td>0.054774</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                         mean       std\n",
       "LogScore TotalRisk outer outer       0.757266  0.046807\n",
       "LogScore TotalRisk outer inner       0.783553  0.047686\n",
       "LogScore TotalRisk outer central     0.762649  0.050384\n",
       "LogScore TotalRisk inner outer       0.757266  0.046807\n",
       "LogScore TotalRisk inner inner       0.783553  0.047686\n",
       "LogScore TotalRisk inner central     0.762649  0.050384\n",
       "LogScore TotalRisk central outer     0.793767  0.038486\n",
       "LogScore TotalRisk central inner     0.802061  0.039641\n",
       "LogScore TotalRisk central central   0.804374  0.036907\n",
       "LogScore ExcessRisk outer outer      0.683930  0.060733\n",
       "LogScore ExcessRisk outer inner      0.696427  0.061025\n",
       "LogScore ExcessRisk outer central    0.668474  0.059358\n",
       "LogScore ExcessRisk inner outer      0.676975  0.060858\n",
       "LogScore ExcessRisk inner inner      0.500000  0.000000\n",
       "LogScore ExcessRisk inner central    0.592383  0.061051\n",
       "LogScore ExcessRisk central outer    0.699839  0.060773\n",
       "LogScore ExcessRisk central inner    0.612817  0.065255\n",
       "LogScore ExcessRisk central central  0.500000  0.000000\n",
       "LogScore BayesRisk outer             0.782573  0.041099\n",
       "LogScore BayesRisk inner             0.783553  0.047686\n",
       "LogScore BayesRisk central           0.804374  0.036907\n",
       "LogScore energy outer                0.746138  0.052281\n",
       "LogScore energy inner                0.748162  0.054774"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ce_full_res = get_specific_stats(\n",
    "    architecture_=architecture,\n",
    "    loss_function_=LossName.CROSS_ENTROPY.value,\n",
    "    base_rule_=GName.LOG_SCORE.value,\n",
    ")\n",
    "\n",
    "pd.DataFrame.from_dict(ce_full_res).T"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "6c36db38-e7e4-4c04-87f1-056267c6bf1a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk outer outer</th>\n",
       "      <td>0.788128</td>\n",
       "      <td>0.036038</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk outer inner</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038219</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk outer central</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038219</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk inner outer</th>\n",
       "      <td>0.788128</td>\n",
       "      <td>0.036038</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk inner inner</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038220</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk inner central</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038220</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk central outer</th>\n",
       "      <td>0.788128</td>\n",
       "      <td>0.036038</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk central inner</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038220</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore TotalRisk central central</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038220</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk outer outer</th>\n",
       "      <td>0.720286</td>\n",
       "      <td>0.036689</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk outer inner</th>\n",
       "      <td>0.720286</td>\n",
       "      <td>0.036689</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk outer central</th>\n",
       "      <td>0.720286</td>\n",
       "      <td>0.036689</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk inner outer</th>\n",
       "      <td>0.720286</td>\n",
       "      <td>0.036689</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk inner inner</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk inner central</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk central outer</th>\n",
       "      <td>0.720286</td>\n",
       "      <td>0.036689</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk central inner</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore ExcessRisk central central</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore BayesRisk outer</th>\n",
       "      <td>0.764098</td>\n",
       "      <td>0.032527</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore BayesRisk inner</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038220</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BrierScore BayesRisk central</th>\n",
       "      <td>0.796245</td>\n",
       "      <td>0.038220</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                           mean       std\n",
       "BrierScore TotalRisk outer outer       0.788128  0.036038\n",
       "BrierScore TotalRisk outer inner       0.796245  0.038219\n",
       "BrierScore TotalRisk outer central     0.796245  0.038219\n",
       "BrierScore TotalRisk inner outer       0.788128  0.036038\n",
       "BrierScore TotalRisk inner inner       0.796245  0.038220\n",
       "BrierScore TotalRisk inner central     0.796245  0.038220\n",
       "BrierScore TotalRisk central outer     0.788128  0.036038\n",
       "BrierScore TotalRisk central inner     0.796245  0.038220\n",
       "BrierScore TotalRisk central central   0.796245  0.038220\n",
       "BrierScore ExcessRisk outer outer      0.720286  0.036689\n",
       "BrierScore ExcessRisk outer inner      0.720286  0.036689\n",
       "BrierScore ExcessRisk outer central    0.720286  0.036689\n",
       "BrierScore ExcessRisk inner outer      0.720286  0.036689\n",
       "BrierScore ExcessRisk inner inner      0.500000  0.000000\n",
       "BrierScore ExcessRisk inner central    0.500000  0.000000\n",
       "BrierScore ExcessRisk central outer    0.720286  0.036689\n",
       "BrierScore ExcessRisk central inner    0.500000  0.000000\n",
       "BrierScore ExcessRisk central central  0.500000  0.000000\n",
       "BrierScore BayesRisk outer             0.764098  0.032527\n",
       "BrierScore BayesRisk inner             0.796245  0.038220\n",
       "BrierScore BayesRisk central           0.796245  0.038220"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ce_full_res = get_specific_stats(\n",
    "    architecture_=architecture,\n",
    "    loss_function_=LossName.CROSS_ENTROPY.value,\n",
    "    base_rule_=GName.BRIER_SCORE.value,\n",
    ")\n",
    "\n",
    "pd.DataFrame.from_dict(ce_full_res).T"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "79531885-208f-468a-9b8c-9f124e8200e1",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "33dee21d-6850-479c-91ad-e325a59e45a7",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk outer outer</th>\n",
       "      <td>0.816813</td>\n",
       "      <td>0.016673</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk outer inner</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk outer central</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk inner outer</th>\n",
       "      <td>0.816813</td>\n",
       "      <td>0.016673</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk inner inner</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk inner central</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk central outer</th>\n",
       "      <td>0.816813</td>\n",
       "      <td>0.016673</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk central inner</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore TotalRisk central central</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk outer outer</th>\n",
       "      <td>0.764256</td>\n",
       "      <td>0.030609</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk outer inner</th>\n",
       "      <td>0.780974</td>\n",
       "      <td>0.032516</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk outer central</th>\n",
       "      <td>0.780974</td>\n",
       "      <td>0.032516</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk inner outer</th>\n",
       "      <td>0.721795</td>\n",
       "      <td>0.021412</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk inner inner</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk inner central</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk central outer</th>\n",
       "      <td>0.721795</td>\n",
       "      <td>0.021412</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk central inner</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore ExcessRisk central central</th>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore BayesRisk outer</th>\n",
       "      <td>0.746145</td>\n",
       "      <td>0.021217</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore BayesRisk inner</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ZeroOneScore BayesRisk central</th>\n",
       "      <td>0.809268</td>\n",
       "      <td>0.018199</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                             mean       std\n",
       "ZeroOneScore TotalRisk outer outer       0.816813  0.016673\n",
       "ZeroOneScore TotalRisk outer inner       0.809268  0.018199\n",
       "ZeroOneScore TotalRisk outer central     0.809268  0.018199\n",
       "ZeroOneScore TotalRisk inner outer       0.816813  0.016673\n",
       "ZeroOneScore TotalRisk inner inner       0.809268  0.018199\n",
       "ZeroOneScore TotalRisk inner central     0.809268  0.018199\n",
       "ZeroOneScore TotalRisk central outer     0.816813  0.016673\n",
       "ZeroOneScore TotalRisk central inner     0.809268  0.018199\n",
       "ZeroOneScore TotalRisk central central   0.809268  0.018199\n",
       "ZeroOneScore ExcessRisk outer outer      0.764256  0.030609\n",
       "ZeroOneScore ExcessRisk outer inner      0.780974  0.032516\n",
       "ZeroOneScore ExcessRisk outer central    0.780974  0.032516\n",
       "ZeroOneScore ExcessRisk inner outer      0.721795  0.021412\n",
       "ZeroOneScore ExcessRisk inner inner      0.500000  0.000000\n",
       "ZeroOneScore ExcessRisk inner central    0.500000  0.000000\n",
       "ZeroOneScore ExcessRisk central outer    0.721795  0.021412\n",
       "ZeroOneScore ExcessRisk central inner    0.500000  0.000000\n",
       "ZeroOneScore ExcessRisk central central  0.500000  0.000000\n",
       "ZeroOneScore BayesRisk outer             0.746145  0.021217\n",
       "ZeroOneScore BayesRisk inner             0.809268  0.018199\n",
       "ZeroOneScore BayesRisk central           0.809268  0.018199"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ce_full_res = get_specific_stats(\n",
    "    architecture_=architecture,\n",
    "    loss_function_=LossName.CROSS_ENTROPY.value,\n",
    "    base_rule_=GName.ZERO_ONE_SCORE.value,\n",
    ")\n",
    "\n",
    "ce_zo = pd.DataFrame.from_dict(ce_full_res).T\n",
    "\n",
    "ce_zo"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d46b3bea-e538-4212-8841-7df68f59e8f3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "924ffc7a-d600-42ac-b832-7af46e38ce69",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1476f355-ce55-4fcb-8b4b-c19bb8dd3ac5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cffe0140-69d6-49e7-a749-06b3c4c9dbbf",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "id": "08232774-49a4-480c-8b79-afa01fe5af28",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "CrossEntropy LogScore\n",
      "CrossEntropy BrierScore\n",
      "CrossEntropy SphericalScore\n",
      "CrossEntropy ZeroOneScore\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_1729049/4265140004.py:58: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  mean_tab = 100 * df_aux.applymap(lambda x: x['mean']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:59: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  std_tab = 100 * df_aux.applymap(lambda x: x['std']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:58: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  mean_tab = 100 * df_aux.applymap(lambda x: x['mean']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:59: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  std_tab = 100 * df_aux.applymap(lambda x: x['std']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:58: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  mean_tab = 100 * df_aux.applymap(lambda x: x['mean']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:59: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  std_tab = 100 * df_aux.applymap(lambda x: x['std']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:58: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  mean_tab = 100 * df_aux.applymap(lambda x: x['mean']).round(4)\n",
      "/tmp/ipykernel_1729049/4265140004.py:59: FutureWarning: DataFrame.applymap has been deprecated. Use DataFrame.map instead.\n",
      "  std_tab = 100 * df_aux.applymap(lambda x: x['std']).round(4)\n"
     ]
    }
   ],
   "source": [
    "full_mean_tab = None\n",
    "full_std_tab = None\n",
    "\n",
    "full_index = None\n",
    "\n",
    "for ind_dataset, model_source in [\n",
    "    # (DatasetName.CIFAR10.value, ModelSource.OUR_MODELS.value),\n",
    "    # (DatasetName.CIFAR100.value, ModelSource.OUR_MODELS.value),\n",
    "    # (DatasetName.CIFAR10_NOISY_LABEL.value, ModelSource.OUR_MODELS.value),\n",
    "    # (DatasetName.CIFAR100_NOISY_LABEL.value, ModelSource.OUR_MODELS.value),\n",
    "    (DatasetName.TINY_IMAGENET.value, ModelSource.TORCH_UNCERTAINTY.value),\n",
    "]:\n",
    "\n",
    "    full_mis_rocauc = pd.read_pickle(\n",
    "        f\"{REPOSITORY_ROOT}/tables/central_tables/final/{ind_dataset}_{model_source}_full_mis_rocauc.pkl\"\n",
    "    )\n",
    "    \n",
    "    # for (loss_function_, base_rule_) in [\n",
    "    #     # (LossName.CROSS_ENTROPY.value, GName.LOG_SCORE.value),\n",
    "    #     # (LossName.BRIER_SCORE.value, GName.BRIER_SCORE.value),\n",
    "    #     (LossName.SPHERICAL_SCORE.value, GName.SPHERICAL_SCORE.value),\n",
    "    # ]:\n",
    "    for (loss_function_, base_rule_) in [\n",
    "        (LossName.CROSS_ENTROPY.value, GName.LOG_SCORE.value),\n",
    "        (LossName.CROSS_ENTROPY.value, GName.BRIER_SCORE.value),\n",
    "        (LossName.CROSS_ENTROPY.value, GName.SPHERICAL_SCORE.value),\n",
    "        (LossName.CROSS_ENTROPY.value, GName.ZERO_ONE_SCORE.value),\n",
    "    ]:\n",
    "        print(loss_function_, base_rule_)\n",
    "        ce_full_res = get_specific_stats(\n",
    "            architecture_=architecture,\n",
    "            loss_function_=loss_function_,\n",
    "            base_rule_=base_rule_,\n",
    "        )\n",
    "        ce_full_res = {ind_dataset: ce_full_res}\n",
    "        \n",
    "        pd.DataFrame.from_dict(ce_full_res).sort_index()\n",
    "        \n",
    "        # df_aux = pd.DataFrame.from_dict(ce_full_res).loc[\n",
    "        #     [\n",
    "        #     f\"{base_rule_} BayesRisk outer\",\n",
    "        #     f\"{base_rule_} BayesRisk inner\",\n",
    "        #     f\"{base_rule_} BayesRisk central\",\n",
    "        #     f\"{base_rule_} ExcessRisk outer outer\",\n",
    "        #     f\"{base_rule_} ExcessRisk outer inner\",\n",
    "        #     f\"{base_rule_} ExcessRisk inner outer\",\n",
    "        #     f\"{base_rule_} ExcessRisk outer central\",\n",
    "        #     f\"{base_rule_} ExcessRisk central outer\",\n",
    "        #     f\"{base_rule_} TotalRisk outer outer\",\n",
    "        #     f\"{base_rule_} TotalRisk outer inner\",\n",
    "        #     f\"{base_rule_} TotalRisk outer central\",\n",
    "        #     f\"{base_rule_} TotalRisk central outer\",\n",
    "        #     ]\n",
    "        # ]\n",
    "        \n",
    "        df_aux = pd.DataFrame.from_dict(ce_full_res).sort_index()\n",
    "        \n",
    "        mean_tab = 100 * df_aux.applymap(lambda x: x['mean']).round(4)\n",
    "        std_tab = 100 * df_aux.applymap(lambda x: x['std']).round(4)\n",
    "\n",
    "        if (loss_function_ == LossName.CROSS_ENTROPY.value) and (base_rule_ == GName.LOG_SCORE.value):\n",
    "            full_index = mean_tab.index\n",
    "    \n",
    "        if full_mean_tab is None:\n",
    "            # full_mean_tab = mean_tab\n",
    "            # full_std_tab = std_tab\n",
    "            full_mean_tab = mean_tab.reset_index().drop(columns=['index'])\n",
    "            full_std_tab = std_tab.reset_index().drop(columns=['index'])\n",
    "        else:\n",
    "            # full_mean_tab = pd.DataFrame.join(full_mean_tab, mean_tab)\n",
    "            # full_std_tab = pd.DataFrame.join(full_std_tab, std_tab)\n",
    "\n",
    "            full_mean_tab= pd.concat([full_mean_tab, mean_tab.reset_index().drop(columns=['index'])], axis=1, ignore_index=True)\n",
    "            full_std_tab= pd.concat([full_std_tab, std_tab.reset_index().drop(columns=['index'])], axis=1, ignore_index=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6e536bce-0bfb-4243-b494-8bba0030b87d",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "id": "0b637af0-a314-4e5c-be6a-41e97b33d3aa",
   "metadata": {},
   "outputs": [],
   "source": [
    "# full_mean_tab.index = full_index\n",
    "# full_std_tab.index = full_index"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "id": "8bc42644-72ac-49d2-bf4c-8d62bb7a49db",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>0</th>\n",
       "      <th>1</th>\n",
       "      <th>2</th>\n",
       "      <th>3</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk central</th>\n",
       "      <td>86.55</td>\n",
       "      <td>86.80</td>\n",
       "      <td>85.83</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk inner</th>\n",
       "      <td>85.50</td>\n",
       "      <td>86.80</td>\n",
       "      <td>86.80</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk outer</th>\n",
       "      <td>84.99</td>\n",
       "      <td>85.89</td>\n",
       "      <td>85.76</td>\n",
       "      <td>85.88</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central central</th>\n",
       "      <td>50.00</td>\n",
       "      <td>50.00</td>\n",
       "      <td>50.00</td>\n",
       "      <td>50.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central inner</th>\n",
       "      <td>71.77</td>\n",
       "      <td>50.00</td>\n",
       "      <td>81.82</td>\n",
       "      <td>50.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central outer</th>\n",
       "      <td>82.74</td>\n",
       "      <td>75.91</td>\n",
       "      <td>83.60</td>\n",
       "      <td>73.59</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner central</th>\n",
       "      <td>66.83</td>\n",
       "      <td>50.00</td>\n",
       "      <td>78.32</td>\n",
       "      <td>50.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner inner</th>\n",
       "      <td>50.00</td>\n",
       "      <td>50.00</td>\n",
       "      <td>50.00</td>\n",
       "      <td>50.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner outer</th>\n",
       "      <td>80.18</td>\n",
       "      <td>75.91</td>\n",
       "      <td>79.62</td>\n",
       "      <td>73.59</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer central</th>\n",
       "      <td>79.25</td>\n",
       "      <td>75.91</td>\n",
       "      <td>80.73</td>\n",
       "      <td>79.52</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer inner</th>\n",
       "      <td>83.22</td>\n",
       "      <td>75.91</td>\n",
       "      <td>81.95</td>\n",
       "      <td>79.52</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer outer</th>\n",
       "      <td>81.33</td>\n",
       "      <td>75.91</td>\n",
       "      <td>81.02</td>\n",
       "      <td>76.78</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central central</th>\n",
       "      <td>86.55</td>\n",
       "      <td>86.80</td>\n",
       "      <td>85.83</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central inner</th>\n",
       "      <td>86.50</td>\n",
       "      <td>86.80</td>\n",
       "      <td>85.39</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central outer</th>\n",
       "      <td>86.65</td>\n",
       "      <td>86.40</td>\n",
       "      <td>85.43</td>\n",
       "      <td>86.95</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner central</th>\n",
       "      <td>85.18</td>\n",
       "      <td>86.80</td>\n",
       "      <td>86.90</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner inner</th>\n",
       "      <td>85.50</td>\n",
       "      <td>86.80</td>\n",
       "      <td>86.80</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner outer</th>\n",
       "      <td>85.58</td>\n",
       "      <td>86.40</td>\n",
       "      <td>86.92</td>\n",
       "      <td>86.95</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer central</th>\n",
       "      <td>85.18</td>\n",
       "      <td>86.80</td>\n",
       "      <td>86.90</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer inner</th>\n",
       "      <td>85.50</td>\n",
       "      <td>86.80</td>\n",
       "      <td>86.80</td>\n",
       "      <td>87.23</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer outer</th>\n",
       "      <td>85.58</td>\n",
       "      <td>86.40</td>\n",
       "      <td>86.92</td>\n",
       "      <td>86.95</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore energy inner</th>\n",
       "      <td>83.34</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore energy outer</th>\n",
       "      <td>82.40</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                         0      1      2      3\n",
       "LogScore BayesRisk central           86.55  86.80  85.83  87.23\n",
       "LogScore BayesRisk inner             85.50  86.80  86.80  87.23\n",
       "LogScore BayesRisk outer             84.99  85.89  85.76  85.88\n",
       "LogScore ExcessRisk central central  50.00  50.00  50.00  50.00\n",
       "LogScore ExcessRisk central inner    71.77  50.00  81.82  50.00\n",
       "LogScore ExcessRisk central outer    82.74  75.91  83.60  73.59\n",
       "LogScore ExcessRisk inner central    66.83  50.00  78.32  50.00\n",
       "LogScore ExcessRisk inner inner      50.00  50.00  50.00  50.00\n",
       "LogScore ExcessRisk inner outer      80.18  75.91  79.62  73.59\n",
       "LogScore ExcessRisk outer central    79.25  75.91  80.73  79.52\n",
       "LogScore ExcessRisk outer inner      83.22  75.91  81.95  79.52\n",
       "LogScore ExcessRisk outer outer      81.33  75.91  81.02  76.78\n",
       "LogScore TotalRisk central central   86.55  86.80  85.83  87.23\n",
       "LogScore TotalRisk central inner     86.50  86.80  85.39  87.23\n",
       "LogScore TotalRisk central outer     86.65  86.40  85.43  86.95\n",
       "LogScore TotalRisk inner central     85.18  86.80  86.90  87.23\n",
       "LogScore TotalRisk inner inner       85.50  86.80  86.80  87.23\n",
       "LogScore TotalRisk inner outer       85.58  86.40  86.92  86.95\n",
       "LogScore TotalRisk outer central     85.18  86.80  86.90  87.23\n",
       "LogScore TotalRisk outer inner       85.50  86.80  86.80  87.23\n",
       "LogScore TotalRisk outer outer       85.58  86.40  86.92  86.95\n",
       "LogScore energy inner                83.34    NaN    NaN    NaN\n",
       "LogScore energy outer                82.40    NaN    NaN    NaN"
      ]
     },
     "execution_count": 53,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "full_mean_tab = full_mean_tab.sort_index()\n",
    "full_mean_tab"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "id": "fdea9ae4-bb78-475f-9493-5ca7eb7c9d2e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>0</th>\n",
       "      <th>1</th>\n",
       "      <th>2</th>\n",
       "      <th>3</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk central</th>\n",
       "      <td>0.26</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.36</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk inner</th>\n",
       "      <td>0.23</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore BayesRisk outer</th>\n",
       "      <td>0.24</td>\n",
       "      <td>0.27</td>\n",
       "      <td>0.26</td>\n",
       "      <td>0.27</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central central</th>\n",
       "      <td>0.00</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central inner</th>\n",
       "      <td>0.13</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.47</td>\n",
       "      <td>0.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk central outer</th>\n",
       "      <td>0.34</td>\n",
       "      <td>0.59</td>\n",
       "      <td>0.47</td>\n",
       "      <td>0.44</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner central</th>\n",
       "      <td>0.11</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.58</td>\n",
       "      <td>0.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner inner</th>\n",
       "      <td>0.00</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk inner outer</th>\n",
       "      <td>0.31</td>\n",
       "      <td>0.59</td>\n",
       "      <td>0.54</td>\n",
       "      <td>0.44</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer central</th>\n",
       "      <td>0.25</td>\n",
       "      <td>0.59</td>\n",
       "      <td>0.54</td>\n",
       "      <td>0.68</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer inner</th>\n",
       "      <td>0.28</td>\n",
       "      <td>0.59</td>\n",
       "      <td>0.55</td>\n",
       "      <td>0.68</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore ExcessRisk outer outer</th>\n",
       "      <td>0.29</td>\n",
       "      <td>0.59</td>\n",
       "      <td>0.54</td>\n",
       "      <td>0.56</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central central</th>\n",
       "      <td>0.26</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.36</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central inner</th>\n",
       "      <td>0.25</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.37</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk central outer</th>\n",
       "      <td>0.26</td>\n",
       "      <td>0.32</td>\n",
       "      <td>0.39</td>\n",
       "      <td>0.31</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner central</th>\n",
       "      <td>0.23</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.29</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner inner</th>\n",
       "      <td>0.23</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk inner outer</th>\n",
       "      <td>0.22</td>\n",
       "      <td>0.32</td>\n",
       "      <td>0.30</td>\n",
       "      <td>0.31</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer central</th>\n",
       "      <td>0.23</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.29</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer inner</th>\n",
       "      <td>0.23</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.28</td>\n",
       "      <td>0.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore TotalRisk outer outer</th>\n",
       "      <td>0.22</td>\n",
       "      <td>0.32</td>\n",
       "      <td>0.30</td>\n",
       "      <td>0.31</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore energy inner</th>\n",
       "      <td>0.23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>LogScore energy outer</th>\n",
       "      <td>0.24</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        0     1     2     3\n",
       "LogScore BayesRisk central           0.26  0.28  0.36  0.35\n",
       "LogScore BayesRisk inner             0.23  0.28  0.28  0.35\n",
       "LogScore BayesRisk outer             0.24  0.27  0.26  0.27\n",
       "LogScore ExcessRisk central central  0.00  0.00  0.00  0.00\n",
       "LogScore ExcessRisk central inner    0.13  0.00  0.47  0.00\n",
       "LogScore ExcessRisk central outer    0.34  0.59  0.47  0.44\n",
       "LogScore ExcessRisk inner central    0.11  0.00  0.58  0.00\n",
       "LogScore ExcessRisk inner inner      0.00  0.00  0.00  0.00\n",
       "LogScore ExcessRisk inner outer      0.31  0.59  0.54  0.44\n",
       "LogScore ExcessRisk outer central    0.25  0.59  0.54  0.68\n",
       "LogScore ExcessRisk outer inner      0.28  0.59  0.55  0.68\n",
       "LogScore ExcessRisk outer outer      0.29  0.59  0.54  0.56\n",
       "LogScore TotalRisk central central   0.26  0.28  0.36  0.35\n",
       "LogScore TotalRisk central inner     0.25  0.28  0.37  0.35\n",
       "LogScore TotalRisk central outer     0.26  0.32  0.39  0.31\n",
       "LogScore TotalRisk inner central     0.23  0.28  0.29  0.35\n",
       "LogScore TotalRisk inner inner       0.23  0.28  0.28  0.35\n",
       "LogScore TotalRisk inner outer       0.22  0.32  0.30  0.31\n",
       "LogScore TotalRisk outer central     0.23  0.28  0.29  0.35\n",
       "LogScore TotalRisk outer inner       0.23  0.28  0.28  0.35\n",
       "LogScore TotalRisk outer outer       0.22  0.32  0.30  0.31\n",
       "LogScore energy inner                0.23   NaN   NaN   NaN\n",
       "LogScore energy outer                0.24   NaN   NaN   NaN"
      ]
     },
     "execution_count": 54,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "full_std_tab = full_std_tab.sort_index()\n",
    "full_std_tab"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "id": "54fc83c5-18f3-4070-bec7-f359afa43dd6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lllll}\n",
      "\\toprule\n",
      " & 0 & 1 & 2 & 3 \\\\\n",
      "\\midrule\n",
      "LogScore BayesRisk central & 86.55 $\\pm$ 0.26 & 86.8 $\\pm$ 0.28 & 85.83 $\\pm$ 0.36 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore BayesRisk inner & 85.5 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.8 $\\pm$ 0.28 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore BayesRisk outer & 84.99 $\\pm$ 0.24 & 85.89 $\\pm$ 0.27 & 85.76 $\\pm$ 0.26 & 85.88 $\\pm$ 0.27 \\\\\n",
      "LogScore ExcessRisk central central & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore ExcessRisk central inner & 71.77 $\\pm$ 0.13 & 50.0 $\\pm$ 0.0 & 81.82 $\\pm$ 0.47 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore ExcessRisk central outer & 82.74 $\\pm$ 0.34 & 75.91 $\\pm$ 0.59 & 83.6 $\\pm$ 0.47 & 73.59 $\\pm$ 0.44 \\\\\n",
      "LogScore ExcessRisk inner central & 66.83 $\\pm$ 0.11 & 50.0 $\\pm$ 0.0 & 78.32 $\\pm$ 0.58 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore ExcessRisk inner inner & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore ExcessRisk inner outer & 80.18 $\\pm$ 0.31 & 75.91 $\\pm$ 0.59 & 79.62 $\\pm$ 0.54 & 73.59 $\\pm$ 0.44 \\\\\n",
      "LogScore ExcessRisk outer central & 79.25 $\\pm$ 0.25 & 75.91 $\\pm$ 0.59 & 80.73 $\\pm$ 0.54 & 79.52 $\\pm$ 0.68 \\\\\n",
      "LogScore ExcessRisk outer inner & 83.22 $\\pm$ 0.28 & 75.91 $\\pm$ 0.59 & 81.95 $\\pm$ 0.55 & 79.52 $\\pm$ 0.68 \\\\\n",
      "LogScore ExcessRisk outer outer & 81.33 $\\pm$ 0.29 & 75.91 $\\pm$ 0.59 & 81.02 $\\pm$ 0.54 & 76.78 $\\pm$ 0.56 \\\\\n",
      "LogScore TotalRisk central central & 86.55 $\\pm$ 0.26 & 86.8 $\\pm$ 0.28 & 85.83 $\\pm$ 0.36 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore TotalRisk central inner & 86.5 $\\pm$ 0.25 & 86.8 $\\pm$ 0.28 & 85.39 $\\pm$ 0.37 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore TotalRisk central outer & 86.65 $\\pm$ 0.26 & 86.4 $\\pm$ 0.32 & 85.43 $\\pm$ 0.39 & 86.95 $\\pm$ 0.31 \\\\\n",
      "LogScore TotalRisk inner central & 85.18 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.9 $\\pm$ 0.29 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore TotalRisk inner inner & 85.5 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.8 $\\pm$ 0.28 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore TotalRisk inner outer & 85.58 $\\pm$ 0.22 & 86.4 $\\pm$ 0.32 & 86.92 $\\pm$ 0.3 & 86.95 $\\pm$ 0.31 \\\\\n",
      "LogScore TotalRisk outer central & 85.18 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.9 $\\pm$ 0.29 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore TotalRisk outer inner & 85.5 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.8 $\\pm$ 0.28 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore TotalRisk outer outer & 85.58 $\\pm$ 0.22 & 86.4 $\\pm$ 0.32 & 86.92 $\\pm$ 0.3 & 86.95 $\\pm$ 0.31 \\\\\n",
      "LogScore energy inner & 83.34 $\\pm$ 0.23 & nan $\\pm$ nan & nan $\\pm$ nan & nan $\\pm$ nan \\\\\n",
      "LogScore energy outer & 82.4 $\\pm$ 0.24 & nan $\\pm$ nan & nan $\\pm$ nan & nan $\\pm$ nan \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    }
   ],
   "source": [
    "# Merge the mean and std tables based on their index to create a combined LaTeX table.\n",
    "merged_table = full_mean_tab.round(3).copy()\n",
    "\n",
    "# For each numeric column, combine the mean and std in the format: mean \\pm std\n",
    "for col in full_mean_tab.columns:\n",
    "    merged_table[col] = full_mean_tab.round(3)[col].astype(str) + \" $\\\\pm$ \" + full_std_tab[col].round(3).astype(str)\n",
    "\n",
    "# Create LaTeX format\n",
    "latex_table = merged_table.to_latex(index=True, escape=False, float_format=\"%.2f\")\n",
    "\n",
    "# Output the resulting LaTeX table for the user\n",
    "print(latex_table)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "id": "fe53aff8-0507-47db-b921-2f5e3c0f459d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lllll}\n",
      "\\toprule\n",
      " & 0 & 1 & 2 & 3 \\\\\n",
      "\\midrule\n",
      "LogScore \\(\\Rtildebayes^{(3)}\\) & 86.55 $\\pm$ 0.26 & 86.8 $\\pm$ 0.28 & 85.83 $\\pm$ 0.36 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildebayes^{(2)}\\) & 85.5 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.8 $\\pm$ 0.28 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildebayes^{(1)}\\) & 84.99 $\\pm$ 0.24 & 85.89 $\\pm$ 0.27 & 85.76 $\\pm$ 0.26 & 85.88 $\\pm$ 0.27 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(3, 3)}\\) & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(3, 2)}\\) & 71.77 $\\pm$ 0.13 & 50.0 $\\pm$ 0.0 & 81.82 $\\pm$ 0.47 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(3, 1)}\\) & 82.74 $\\pm$ 0.34 & 75.91 $\\pm$ 0.59 & 83.6 $\\pm$ 0.47 & 73.59 $\\pm$ 0.44 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(2, 3)}\\) & 66.83 $\\pm$ 0.11 & 50.0 $\\pm$ 0.0 & 78.32 $\\pm$ 0.58 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(2, 2)}\\) & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 & 50.0 $\\pm$ 0.0 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(2, 1)}\\) & 80.18 $\\pm$ 0.31 & 75.91 $\\pm$ 0.59 & 79.62 $\\pm$ 0.54 & 73.59 $\\pm$ 0.44 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(1, 3)}\\) & 79.25 $\\pm$ 0.25 & 75.91 $\\pm$ 0.59 & 80.73 $\\pm$ 0.54 & 79.52 $\\pm$ 0.68 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(1, 2)}\\) & 83.22 $\\pm$ 0.28 & 75.91 $\\pm$ 0.59 & 81.95 $\\pm$ 0.55 & 79.52 $\\pm$ 0.68 \\\\\n",
      "LogScore \\(\\Rtildeexc^{(1, 1)}\\) & 81.33 $\\pm$ 0.29 & 75.91 $\\pm$ 0.59 & 81.02 $\\pm$ 0.54 & 76.78 $\\pm$ 0.56 \\\\\n",
      "LogScore \\(\\Rtildetot^{(3, 3)}\\) & 86.55 $\\pm$ 0.26 & 86.8 $\\pm$ 0.28 & 85.83 $\\pm$ 0.36 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildetot^{(3, 2)}\\) & 86.5 $\\pm$ 0.25 & 86.8 $\\pm$ 0.28 & 85.39 $\\pm$ 0.37 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildetot^{(3, 1)}\\) & 86.65 $\\pm$ 0.26 & 86.4 $\\pm$ 0.32 & 85.43 $\\pm$ 0.39 & 86.95 $\\pm$ 0.31 \\\\\n",
      "LogScore \\(\\Rtildetot^{(2, 3)}\\) & 85.18 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.9 $\\pm$ 0.29 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildetot^{(2, 2)}\\) & 85.5 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.8 $\\pm$ 0.28 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildetot^{(2, 1)}\\) & 85.58 $\\pm$ 0.22 & 86.4 $\\pm$ 0.32 & 86.92 $\\pm$ 0.3 & 86.95 $\\pm$ 0.31 \\\\\n",
      "LogScore \\(\\Rtildetot^{(1, 3)}\\) & 85.18 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.9 $\\pm$ 0.29 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildetot^{(1, 2)}\\) & 85.5 $\\pm$ 0.23 & 86.8 $\\pm$ 0.28 & 86.8 $\\pm$ 0.28 & 87.23 $\\pm$ 0.35 \\\\\n",
      "LogScore \\(\\Rtildetot^{(1, 1)}\\) & 85.58 $\\pm$ 0.22 & 86.4 $\\pm$ 0.32 & 86.92 $\\pm$ 0.3 & 86.95 $\\pm$ 0.31 \\\\\n",
      "LogScore \\( E(x;\\E_{\\theta}f_{\\theta}) \\) & 83.34 $\\pm$ 0.23 & nan $\\pm$ nan & nan $\\pm$ nan & nan $\\pm$ nan \\\\\n",
      "LogScore \\( \\E_{\\theta} E(x;f_{\\theta}) \\) & 82.4 $\\pm$ 0.24 & nan $\\pm$ nan & nan $\\pm$ nan & nan $\\pm$ nan \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    }
   ],
   "source": [
    "replace_dictionary = {\n",
    "    \"BayesRisk central\": r\"\\(\\Rtildebayes^{(3)}\\)\",\n",
    "    \"BayesRisk inner\": r\"\\(\\Rtildebayes^{(2)}\\)\",\n",
    "    \"BayesRisk outer\": r\"\\(\\Rtildebayes^{(1)}\\)\",\n",
    "    \"ExcessRisk central central\": r\"\\(\\Rtildeexc^{(3, 3)}\\)\",\n",
    "    \"ExcessRisk central inner\": r\"\\(\\Rtildeexc^{(3, 2)}\\)\",\n",
    "    \"ExcessRisk central outer\": r\"\\(\\Rtildeexc^{(3, 1)}\\)\",\n",
    "    \"ExcessRisk inner central\": r\"\\(\\Rtildeexc^{(2, 3)}\\)\",\n",
    "    \"ExcessRisk inner inner\": r\"\\(\\Rtildeexc^{(2, 2)}\\)\",\n",
    "    \"ExcessRisk inner outer\": r\"\\(\\Rtildeexc^{(2, 1)}\\)\",\n",
    "    \"ExcessRisk outer central\": r\"\\(\\Rtildeexc^{(1, 3)}\\)\",\n",
    "    \"ExcessRisk outer inner\": r\"\\(\\Rtildeexc^{(1, 2)}\\)\",\n",
    "    \"ExcessRisk outer outer\": r\"\\(\\Rtildeexc^{(1, 1)}\\)\",\n",
    "    \"TotalRisk central central\": r\"\\(\\Rtildetot^{(3, 3)}\\)\",\n",
    "    \"TotalRisk central inner\": r\"\\(\\Rtildetot^{(3, 2)}\\)\",\n",
    "    \"TotalRisk central outer\": r\"\\(\\Rtildetot^{(3, 1)}\\)\",\n",
    "    \"TotalRisk inner central\": r\"\\(\\Rtildetot^{(2, 3)}\\)\",\n",
    "    \"TotalRisk inner inner\": r\"\\(\\Rtildetot^{(2, 2)}\\)\",\n",
    "    \"TotalRisk inner outer\": r\"\\(\\Rtildetot^{(2, 1)}\\)\",\n",
    "    \"TotalRisk outer central\": r\"\\(\\Rtildetot^{(1, 3)}\\)\",\n",
    "    \"TotalRisk outer inner\": r\"\\(\\Rtildetot^{(1, 2)}\\)\",\n",
    "    \"TotalRisk outer outer\": r\"\\(\\Rtildetot^{(1, 1)}\\)\",\n",
    "    \"energy inner\": r\"\\( E(x;\\E_{\\theta}f_{\\theta}) \\)\",\n",
    "    \"energy outer\": r\"\\( \\E_{\\theta} E(x;f_{\\theta}) \\)\",\n",
    "    \n",
    "} \n",
    "for key in replace_dictionary.keys():\n",
    "    latex_table = latex_table.replace(key, replace_dictionary[key])\n",
    "\n",
    "print(latex_table)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "76763e52-54a5-4db6-928a-4c053a415d03",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e68606d5-0594-43be-8609-7b09bc9aea88",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e9f21114-edb2-4b74-bfb7-141be7f829d3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "47a3e2e9-df62-4517-95b9-ec0a37c26f05",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1cad8705-bba4-463a-a586-b596580a1e88",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ad4390c7-b1ba-4645-8bda-31313031df84",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7a23a47a-7f4a-41b2-81c1-c71a56b947a6",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bdc41421-998b-42e8-a095-1c741dc0cc85",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "aca6c2aa-49b5-4e32-b088-85eac56bb232",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "edeeb685-ae3a-48f5-ad49-062e4e031def",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f087165e-3411-41d7-a689-1c9d1f3757db",
   "metadata": {},
   "outputs": [],
   "source": [
    "full_mis_rocauc = full_mis_rocauc[~full_mis_rocauc.UQMetric.str.endswith(\"Inner Inner\")]\n",
    "\n",
    "full_mis_rocauc.loc[\n",
    "    (full_mis_rocauc.RiskType == \"Bayes\")\n",
    "    & full_mis_rocauc.UQMetric.str.endswith(\"Outer\"),\n",
    "    \"RiskType\",\n",
    "] = \"Bayes Outer\"\n",
    "full_mis_rocauc.loc[\n",
    "    (full_mis_rocauc.RiskType == \"Bayes\")\n",
    "    & full_mis_rocauc.UQMetric.str.endswith(\"Inner\"),\n",
    "    \"RiskType\",\n",
    "] = \"Bayes Inner\"\n",
    "\n",
    "full_mis_rocauc.loc[\n",
    "    (full_mis_rocauc.RiskType == \"Total\")\n",
    "    & full_mis_rocauc.UQMetric.str.endswith(\"Outer\"),\n",
    "    \"RiskType\",\n",
    "] = \"Total Outer\"\n",
    "full_mis_rocauc.loc[\n",
    "    (full_mis_rocauc.RiskType == \"Total\")\n",
    "    & full_mis_rocauc.UQMetric.str.endswith(\"Inner\"),\n",
    "    \"RiskType\",\n",
    "] = \"Total Inner\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2766ad9e-e869-43d6-a767-1538d4de2e2f",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# trunc_df = full_mis_rocauc[\n",
    "# ~full_mis_rocauc.RiskType.isin(['Bias', 'MV', 'MVBI', 'BiasBI', 'Bregman Information', 'Reverse Bregman Information'])\n",
    "# # full_mis_rocauc.base_rule.isin(['Brier', 'Logscore', 'Spherical']) &\n",
    "# # full_mis_rocauc.LossFunction.isin(['Brier', 'Logscore', 'Spherical']) &\n",
    "# # ~(np.isclose(full_mis_rocauc.RocAucScore, np.float64(0.5)))\n",
    "# ]\n",
    "\n",
    "# # trunc_df.sort_values(by='RocAucScore')\n",
    "\n",
    "# trunc_df.to_csv(os.path.join('tables', 'full_mis_rocauc_only_risks.csv'), index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c3124af6-13d5-4195-b50c-418b2f120d02",
   "metadata": {},
   "outputs": [],
   "source": [
    "grouped_df = extract_same_different_dataframes(\n",
    "    dataframe_=full_mis_rocauc,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ab932668-3483-4e74-b542-5ae9f4c83c7f",
   "metadata": {},
   "outputs": [],
   "source": [
    "same_dict, _ = collect_scores_into_dict_miss(\n",
    "    dataframes_list_=[\n",
    "        grouped_df.logscore_logscore,\n",
    "        grouped_df.brier_brier,\n",
    "        grouped_df.spherical_spherical,\n",
    "    ],\n",
    ")\n",
    "same_df = pd.DataFrame.from_dict(same_dict)\n",
    "\n",
    "same_agg_df = aggregate_over_measures(\n",
    "    dataframe_=same_df,\n",
    "    agg_func_=\"mean\",\n",
    "    by_=[\"InD\"],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "509ec612-1455-4cff-9c39-d4f128178a72",
   "metadata": {},
   "outputs": [],
   "source": [
    "different_dict, _ = collect_scores_into_dict_miss(\n",
    "    dataframes_list_=[\n",
    "        grouped_df.logscore_not_logscore,\n",
    "        grouped_df.brier_not_brier,\n",
    "        grouped_df.spherical_not_spherical,\n",
    "    ],\n",
    ")\n",
    "different_df = pd.DataFrame.from_dict(different_dict)\n",
    "\n",
    "different_agg_df = aggregate_over_measures(\n",
    "    dataframe_=different_df,\n",
    "    agg_func_=\"mean\",\n",
    "    by_=[\"InD\"],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3d52cb31-1c25-4655-88e9-1c12286643aa",
   "metadata": {},
   "outputs": [],
   "source": [
    "all_dict, _ = collect_scores_into_dict_miss(\n",
    "    dataframes_list_=[\n",
    "        full_mis_rocauc,\n",
    "    ],\n",
    ")\n",
    "all_df = pd.DataFrame.from_dict(all_dict)\n",
    "\n",
    "all_agg_df = aggregate_over_measures(\n",
    "    dataframe_=all_df,\n",
    "    agg_func_=\"mean\",\n",
    "    by_=[\"InD\"],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "59281968-84ab-48d7-b5b5-d678ab8d97aa",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(all_agg_df)\n",
    "display(same_agg_df)\n",
    "display(different_agg_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "57cd4d55-112b-44b9-a795-a4fee6103d45",
   "metadata": {},
   "outputs": [],
   "source": [
    "same_agg_df.index"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fe7364a1-4b3d-480c-a812-77874c1b3af6",
   "metadata": {},
   "outputs": [],
   "source": [
    "def enhance_latex_table(input_latex):\n",
    "    lines = input_latex.split(\"\\n\")\n",
    "    enhanced_lines = []\n",
    "\n",
    "    for i, line in enumerate(lines):\n",
    "        if \"\\\\toprule\" in line:\n",
    "            # Add multicolumn headers\n",
    "            enhanced_lines.append(line)\n",
    "            enhanced_lines.append(\n",
    "                r\"\\multicolumn{2}{c}{Dataset} & \\multicolumn{5}{c}{Metrics} \\\\\"\n",
    "            )\n",
    "            enhanced_lines.append(r\"\\cmidrule(lr){1-2} \\cmidrule(lr){3-7}\")\n",
    "            continue\n",
    "\n",
    "        # Add row coloring\n",
    "        if \"\\\\midrule\" in line:\n",
    "            enhanced_lines.append(line)\n",
    "            enhanced_lines.append(r\"\\rowcolor{gray!10}\")\n",
    "        elif \"\\\\bottomrule\" in line:\n",
    "            enhanced_lines.append(r\"\\end{tabular}\")\n",
    "        else:\n",
    "            enhanced_lines.append(line)\n",
    "\n",
    "    return \"\\n\".join(enhanced_lines)\n",
    "\n",
    "\n",
    "def get_nice_df(df_):\n",
    "    df_.index = pd.Index(\n",
    "        data=[\n",
    "            \"CIFAR10\",\n",
    "            \"CIFAR100\",\n",
    "            \"Missed class CIFAR10\",\n",
    "            \"Noisy CIFAR10\",\n",
    "            \"Noisy CIFAR100\",\n",
    "        ],\n",
    "        name=\"InD\",\n",
    "    )\n",
    "    df_.columns = [\n",
    "        # 'Bayes',\n",
    "        # 'Excess',\n",
    "        # 'Total',\n",
    "        \"Bayes(O)\",\n",
    "        \"Bayes(I)\",\n",
    "        \"Total(O)\",\n",
    "        \"Total(I)\",\n",
    "        \"BI\",\n",
    "        \"RBI\",\n",
    "        \"EPBI\",\n",
    "        # 'Bias',\n",
    "        # 'MV',\n",
    "        # 'MVBI',\n",
    "        # 'BiasBI',\n",
    "    ]\n",
    "    # df_ = df_[['Bayes', 'Excess', 'Total', 'BI', 'RBI']]\n",
    "    df_ = (100 * df_).round(2)\n",
    "\n",
    "    display(df_)\n",
    "\n",
    "    return df_, df_.to_latex(float_format=\"%.2f\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0f22c426-53c8-4735-92f1-1af2ea06fe61",
   "metadata": {},
   "outputs": [],
   "source": [
    "measures = [\n",
    "    \"Bayes Outer\",\n",
    "    \"Bayes Inner\",\n",
    "    \"Total Outer\",\n",
    "    \"Total Inner\",\n",
    "    \"Bregman Information\",\n",
    "    \"Reverse Bregman Information\",\n",
    "    \"Expected Pairwise Bregman Information\",\n",
    "]\n",
    "\n",
    "# measures = ['Bayes', 'Excess', 'Total', 'Bregman Information', 'Reverse Bregman Information', 'Expected Pairwise Bregman Information']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2cd94a7d-6c37-49dc-b97a-1b8000c3161d",
   "metadata": {},
   "outputs": [],
   "source": [
    "nice_same = get_nice_df(same_agg_df.copy()[measures])\n",
    "print(enhance_latex_table(nice_same[1]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8313933e-30cc-4ed2-9421-c0f23a9fbfed",
   "metadata": {},
   "outputs": [],
   "source": [
    "nice_different = get_nice_df(different_agg_df.copy()[measures])\n",
    "print(enhance_latex_table(nice_different[1]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c07fdff8-268c-4ad0-9075-0809f4c0c095",
   "metadata": {},
   "outputs": [],
   "source": [
    "print(\n",
    "    enhance_latex_table(\n",
    "        pd.concat([nice_same[0], nice_different[0]], axis=1).to_latex(\n",
    "            float_format=\"%.2f\"\n",
    "        )\n",
    "    )\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d981c020-496e-45b5-8b38-804dd7a55fd8",
   "metadata": {},
   "outputs": [],
   "source": [
    "nice_same[0].mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "905661a5-5faf-4b0e-8e24-fa5e8f89a66b",
   "metadata": {},
   "outputs": [],
   "source": [
    "nice_same[0].std()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "952aef89-6a01-4cab-8f86-6101663ea673",
   "metadata": {},
   "outputs": [],
   "source": [
    "nice_different[0].mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "14e0dc7d-a5bf-40f5-9c79-5aa899e790e4",
   "metadata": {},
   "outputs": [],
   "source": [
    "nice_different[0].std()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "350fd577-0c2b-4dd9-bdd3-a090202e927c",
   "metadata": {},
   "outputs": [],
   "source": [
    "same_agg_df.eq(same_agg_df.max(axis=1), axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6808ec30-e50e-4ca1-8a31-1011a2ac7246",
   "metadata": {},
   "outputs": [],
   "source": [
    "different_agg_df.eq(different_agg_df.max(axis=1), axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9cb57da5-48b0-463d-85b9-61de7fa6084e",
   "metadata": {},
   "outputs": [],
   "source": [
    "all_agg_df.eq(all_agg_df.max(axis=1), axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ac98d379-05e3-4a33-b2e3-c96fbdfb61d3",
   "metadata": {},
   "outputs": [],
   "source": [
    "(same_agg_df - different_agg_df) > 0"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
