{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import copy \n",
    "import os\n",
    "import re\n",
    "from collections import OrderedDict\n",
    "from pprint import pprint\n",
    "import itertools"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>calib_conf</th>\n",
       "      <th>training_conf</th>\n",
       "      <th>C_1</th>\n",
       "      <th>N_t</th>\n",
       "      <th>N_v</th>\n",
       "      <th>N_hyp_v</th>\n",
       "      <th>Auto-Labeling-Err-Mean</th>\n",
       "      <th>Coverage-Mean</th>\n",
       "      <th>Avg-ECE-Val-Mean</th>\n",
       "      <th>Auto-Labeling-Err-Std</th>\n",
       "      <th>...</th>\n",
       "      <th>training_conf.optimizer</th>\n",
       "      <th>training_conf.reg</th>\n",
       "      <th>training_conf.weight_decay</th>\n",
       "      <th>training_conf_g.batch_size</th>\n",
       "      <th>training_conf_g.max_epochs</th>\n",
       "      <th>training_conf_g.optimizer</th>\n",
       "      <th>training_conf_g.weight_decay</th>\n",
       "      <th>weight_decay</th>\n",
       "      <th>rank_target</th>\n",
       "      <th>rank_weight</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>auto_label_opt_v0</td>\n",
       "      <td>squentropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>2.3387</td>\n",
       "      <td>79.0495</td>\n",
       "      <td>10.2829</td>\n",
       "      <td>0.5167</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>500.0</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.01</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>auto_label_opt_v0</td>\n",
       "      <td>std_cross_entropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>2.9666</td>\n",
       "      <td>78.4820</td>\n",
       "      <td>16.0513</td>\n",
       "      <td>0.2031</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>500.0</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.10</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>auto_label_opt_v0</td>\n",
       "      <td>crl</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>2.2377</td>\n",
       "      <td>77.8595</td>\n",
       "      <td>22.8733</td>\n",
       "      <td>0.6454</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>500.0</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.01</td>\n",
       "      <td>0.010</td>\n",
       "      <td>softmax</td>\n",
       "      <td>0.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>auto_label_opt_v0</td>\n",
       "      <td>fmfp</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>3.0204</td>\n",
       "      <td>77.4455</td>\n",
       "      <td>14.6882</td>\n",
       "      <td>0.4308</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>500.0</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.01</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>dirichlet</td>\n",
       "      <td>squentropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>7.3309</td>\n",
       "      <td>29.3665</td>\n",
       "      <td>13.4658</td>\n",
       "      <td>0.3071</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>temp_scaling</td>\n",
       "      <td>squentropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.9471</td>\n",
       "      <td>28.1660</td>\n",
       "      <td>13.7981</td>\n",
       "      <td>0.5826</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>scaling_binning</td>\n",
       "      <td>squentropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.1907</td>\n",
       "      <td>23.7565</td>\n",
       "      <td>13.3403</td>\n",
       "      <td>0.4242</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>temp_scaling</td>\n",
       "      <td>std_cross_entropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>7.2664</td>\n",
       "      <td>23.1570</td>\n",
       "      <td>16.9683</td>\n",
       "      <td>0.2994</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>dirichlet</td>\n",
       "      <td>std_cross_entropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>7.6810</td>\n",
       "      <td>22.3685</td>\n",
       "      <td>4.0057</td>\n",
       "      <td>0.4806</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>dirichlet</td>\n",
       "      <td>fmfp</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.9052</td>\n",
       "      <td>21.6735</td>\n",
       "      <td>3.7992</td>\n",
       "      <td>0.3577</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>None</td>\n",
       "      <td>squentropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>5.1711</td>\n",
       "      <td>21.1660</td>\n",
       "      <td>14.8103</td>\n",
       "      <td>0.4979</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>temp_scaling</td>\n",
       "      <td>fmfp</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.5359</td>\n",
       "      <td>21.0035</td>\n",
       "      <td>19.7062</td>\n",
       "      <td>0.2837</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.00</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>dirichlet</td>\n",
       "      <td>crl</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>7.7379</td>\n",
       "      <td>20.8665</td>\n",
       "      <td>7.4916</td>\n",
       "      <td>0.1524</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>0.10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.010</td>\n",
       "      <td>softmax</td>\n",
       "      <td>0.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>temp_scaling</td>\n",
       "      <td>crl</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.8317</td>\n",
       "      <td>20.3230</td>\n",
       "      <td>11.2382</td>\n",
       "      <td>0.8033</td>\n",
       "      <td>...</td>\n",
       "      <td>adam</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.010</td>\n",
       "      <td>softmax</td>\n",
       "      <td>0.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>scaling_binning</td>\n",
       "      <td>fmfp</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.1295</td>\n",
       "      <td>19.5350</td>\n",
       "      <td>19.1732</td>\n",
       "      <td>0.4801</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.00</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>scaling_binning</td>\n",
       "      <td>std_cross_entropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>6.0905</td>\n",
       "      <td>18.5820</td>\n",
       "      <td>7.4021</td>\n",
       "      <td>0.3512</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>scaling_binning</td>\n",
       "      <td>crl</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>5.9342</td>\n",
       "      <td>17.8700</td>\n",
       "      <td>10.6656</td>\n",
       "      <td>0.8505</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.010</td>\n",
       "      <td>softmax</td>\n",
       "      <td>0.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>None</td>\n",
       "      <td>crl</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>5.1797</td>\n",
       "      <td>15.8780</td>\n",
       "      <td>27.3655</td>\n",
       "      <td>0.2672</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.010</td>\n",
       "      <td>softmax</td>\n",
       "      <td>0.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>histogram_binning_top_label</td>\n",
       "      <td>squentropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>4.2511</td>\n",
       "      <td>15.8025</td>\n",
       "      <td>2.6350</td>\n",
       "      <td>0.4610</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>histogram_binning_top_label</td>\n",
       "      <td>std_cross_entropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>5.9598</td>\n",
       "      <td>15.5885</td>\n",
       "      <td>3.8193</td>\n",
       "      <td>0.7059</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>None</td>\n",
       "      <td>fmfp</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>4.9255</td>\n",
       "      <td>15.5705</td>\n",
       "      <td>20.3418</td>\n",
       "      <td>0.4446</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>histogram_binning_top_label</td>\n",
       "      <td>fmfp</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>5.1666</td>\n",
       "      <td>14.1700</td>\n",
       "      <td>3.7075</td>\n",
       "      <td>0.5321</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>None</td>\n",
       "      <td>std_cross_entropy</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>4.7882</td>\n",
       "      <td>14.0100</td>\n",
       "      <td>32.4883</td>\n",
       "      <td>0.2198</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>histogram_binning_top_label</td>\n",
       "      <td>crl</td>\n",
       "      <td>0.25</td>\n",
       "      <td>10000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2000</td>\n",
       "      <td>4.3772</td>\n",
       "      <td>12.2995</td>\n",
       "      <td>2.5828</td>\n",
       "      <td>0.5434</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.010</td>\n",
       "      <td>softmax</td>\n",
       "      <td>0.8</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>24 rows × 47 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    calib_conf      training_conf   C_1    N_t   N_v  N_hyp_v  \\\n",
       "1            auto_label_opt_v0         squentropy  0.25  10000  8000     2000   \n",
       "1            auto_label_opt_v0  std_cross_entropy  0.25  10000  8000     2000   \n",
       "1            auto_label_opt_v0                crl  0.25  10000  8000     2000   \n",
       "1            auto_label_opt_v0               fmfp  0.25  10000  8000     2000   \n",
       "2                    dirichlet         squentropy  0.25  10000  8000     2000   \n",
       "5                 temp_scaling         squentropy  0.25  10000  8000     2000   \n",
       "4              scaling_binning         squentropy  0.25  10000  8000     2000   \n",
       "5                 temp_scaling  std_cross_entropy  0.25  10000  8000     2000   \n",
       "2                    dirichlet  std_cross_entropy  0.25  10000  8000     2000   \n",
       "2                    dirichlet               fmfp  0.25  10000  8000     2000   \n",
       "0                         None         squentropy  0.25  10000  8000     2000   \n",
       "5                 temp_scaling               fmfp  0.25  10000  8000     2000   \n",
       "2                    dirichlet                crl  0.25  10000  8000     2000   \n",
       "5                 temp_scaling                crl  0.25  10000  8000     2000   \n",
       "4              scaling_binning               fmfp  0.25  10000  8000     2000   \n",
       "4              scaling_binning  std_cross_entropy  0.25  10000  8000     2000   \n",
       "4              scaling_binning                crl  0.25  10000  8000     2000   \n",
       "0                         None                crl  0.25  10000  8000     2000   \n",
       "3  histogram_binning_top_label         squentropy  0.25  10000  8000     2000   \n",
       "3  histogram_binning_top_label  std_cross_entropy  0.25  10000  8000     2000   \n",
       "0                         None               fmfp  0.25  10000  8000     2000   \n",
       "3  histogram_binning_top_label               fmfp  0.25  10000  8000     2000   \n",
       "0                         None  std_cross_entropy  0.25  10000  8000     2000   \n",
       "3  histogram_binning_top_label                crl  0.25  10000  8000     2000   \n",
       "\n",
       "   Auto-Labeling-Err-Mean  Coverage-Mean  Avg-ECE-Val-Mean  \\\n",
       "1                  2.3387        79.0495           10.2829   \n",
       "1                  2.9666        78.4820           16.0513   \n",
       "1                  2.2377        77.8595           22.8733   \n",
       "1                  3.0204        77.4455           14.6882   \n",
       "2                  7.3309        29.3665           13.4658   \n",
       "5                  6.9471        28.1660           13.7981   \n",
       "4                  6.1907        23.7565           13.3403   \n",
       "5                  7.2664        23.1570           16.9683   \n",
       "2                  7.6810        22.3685            4.0057   \n",
       "2                  6.9052        21.6735            3.7992   \n",
       "0                  5.1711        21.1660           14.8103   \n",
       "5                  6.5359        21.0035           19.7062   \n",
       "2                  7.7379        20.8665            7.4916   \n",
       "5                  6.8317        20.3230           11.2382   \n",
       "4                  6.1295        19.5350           19.1732   \n",
       "4                  6.0905        18.5820            7.4021   \n",
       "4                  5.9342        17.8700           10.6656   \n",
       "0                  5.1797        15.8780           27.3655   \n",
       "3                  4.2511        15.8025            2.6350   \n",
       "3                  5.9598        15.5885            3.8193   \n",
       "0                  4.9255        15.5705           20.3418   \n",
       "3                  5.1666        14.1700            3.7075   \n",
       "0                  4.7882        14.0100           32.4883   \n",
       "3                  4.3772        12.2995            2.5828   \n",
       "\n",
       "   Auto-Labeling-Err-Std  ...  training_conf.optimizer  training_conf.reg  \\\n",
       "1                 0.5167  ...                      NaN                NaN   \n",
       "1                 0.2031  ...                      NaN                NaN   \n",
       "1                 0.6454  ...                      NaN                NaN   \n",
       "1                 0.4308  ...                      NaN                NaN   \n",
       "2                 0.3071  ...                     adam               0.01   \n",
       "5                 0.5826  ...                     adam                NaN   \n",
       "4                 0.4242  ...                      NaN                NaN   \n",
       "5                 0.2994  ...                     adam                NaN   \n",
       "2                 0.4806  ...                     adam               0.10   \n",
       "2                 0.3577  ...                     adam               0.01   \n",
       "0                 0.4979  ...                      NaN                NaN   \n",
       "5                 0.2837  ...                     adam                NaN   \n",
       "2                 0.1524  ...                     adam               0.10   \n",
       "5                 0.8033  ...                     adam                NaN   \n",
       "4                 0.4801  ...                      NaN                NaN   \n",
       "4                 0.3512  ...                      NaN                NaN   \n",
       "4                 0.8505  ...                      NaN                NaN   \n",
       "0                 0.2672  ...                      NaN                NaN   \n",
       "3                 0.4610  ...                      NaN                NaN   \n",
       "3                 0.7059  ...                      NaN                NaN   \n",
       "0                 0.4446  ...                      NaN                NaN   \n",
       "3                 0.5321  ...                      NaN                NaN   \n",
       "0                 0.2198  ...                      NaN                NaN   \n",
       "3                 0.5434  ...                      NaN                NaN   \n",
       "\n",
       "   training_conf.weight_decay  training_conf_g.batch_size  \\\n",
       "1                         NaN                        64.0   \n",
       "1                         NaN                        64.0   \n",
       "1                         NaN                        64.0   \n",
       "1                         NaN                        64.0   \n",
       "2                         NaN                         NaN   \n",
       "5                        0.01                         NaN   \n",
       "4                        0.01                         NaN   \n",
       "5                        0.10                         NaN   \n",
       "2                         NaN                         NaN   \n",
       "2                         NaN                         NaN   \n",
       "0                         NaN                         NaN   \n",
       "5                        1.00                         NaN   \n",
       "2                         NaN                         NaN   \n",
       "5                        0.10                         NaN   \n",
       "4                        1.00                         NaN   \n",
       "4                        0.01                         NaN   \n",
       "4                        0.10                         NaN   \n",
       "0                         NaN                         NaN   \n",
       "3                         NaN                         NaN   \n",
       "3                         NaN                         NaN   \n",
       "0                         NaN                         NaN   \n",
       "3                         NaN                         NaN   \n",
       "0                         NaN                         NaN   \n",
       "3                         NaN                         NaN   \n",
       "\n",
       "   training_conf_g.max_epochs training_conf_g.optimizer  \\\n",
       "1                       500.0                      adam   \n",
       "1                       500.0                      adam   \n",
       "1                       500.0                      adam   \n",
       "1                       500.0                      adam   \n",
       "2                         NaN                       NaN   \n",
       "5                         NaN                       NaN   \n",
       "4                         NaN                       NaN   \n",
       "5                         NaN                       NaN   \n",
       "2                         NaN                       NaN   \n",
       "2                         NaN                       NaN   \n",
       "0                         NaN                       NaN   \n",
       "5                         NaN                       NaN   \n",
       "2                         NaN                       NaN   \n",
       "5                         NaN                       NaN   \n",
       "4                         NaN                       NaN   \n",
       "4                         NaN                       NaN   \n",
       "4                         NaN                       NaN   \n",
       "0                         NaN                       NaN   \n",
       "3                         NaN                       NaN   \n",
       "3                         NaN                       NaN   \n",
       "0                         NaN                       NaN   \n",
       "3                         NaN                       NaN   \n",
       "0                         NaN                       NaN   \n",
       "3                         NaN                       NaN   \n",
       "\n",
       "   training_conf_g.weight_decay weight_decay  rank_target  rank_weight  \n",
       "1                          0.01        0.001          NaN          NaN  \n",
       "1                          0.10        0.001          NaN          NaN  \n",
       "1                          0.01        0.010      softmax          0.8  \n",
       "1                          0.01        0.001          NaN          NaN  \n",
       "2                           NaN        0.001          NaN          NaN  \n",
       "5                           NaN        0.001          NaN          NaN  \n",
       "4                           NaN        0.001          NaN          NaN  \n",
       "5                           NaN        0.001          NaN          NaN  \n",
       "2                           NaN        0.001          NaN          NaN  \n",
       "2                           NaN        0.001          NaN          NaN  \n",
       "0                           NaN        0.001          NaN          NaN  \n",
       "5                           NaN        0.001          NaN          NaN  \n",
       "2                           NaN        0.010      softmax          0.8  \n",
       "5                           NaN        0.010      softmax          0.8  \n",
       "4                           NaN        0.001          NaN          NaN  \n",
       "4                           NaN        0.001          NaN          NaN  \n",
       "4                           NaN        0.010      softmax          0.8  \n",
       "0                           NaN        0.010      softmax          0.8  \n",
       "3                           NaN        0.001          NaN          NaN  \n",
       "3                           NaN        0.001          NaN          NaN  \n",
       "0                           NaN        0.001          NaN          NaN  \n",
       "3                           NaN        0.001          NaN          NaN  \n",
       "0                           NaN        0.001          NaN          NaN  \n",
       "3                           NaN        0.010      softmax          0.8  \n",
       "\n",
       "[24 rows x 47 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "data_models = ['cifar10', 'mnist', 'twenty_newsgroups','tinyimagenet100']\n",
    "dm_identifier = {'cifar10': 'CIFAR-10', \n",
    "                'mnist': 'MNIST', \n",
    "                'twenty_newsgroups': '20newsgroups',\n",
    "                'tinyimagenet100': 'TinyImageNet-100'}\n",
    "sub_metrics = ['Error', 'Coverage']\n",
    "\n",
    "def helper_find_files_and_read_dataframe(root_path, patterns=[r\"cifar10\"]):\n",
    "    #dm_df= OrderedDict((dm, None) for dm in dm_identifier.keys()) \n",
    "    dm_df= OrderedDict((dm, None) for dm in dm_identifier.keys()) \n",
    "    for root, _, files in os.walk(root_path):\n",
    "        for filename in files:\n",
    "            filepath = os.path.join(root, filename)\n",
    "            if os.path.isfile(filepath) and filepath.endswith(\".xlsx\"):\n",
    "                for pattern in patterns:\n",
    "                    if re.search(pattern, filename, re.IGNORECASE):\n",
    "                        if pattern in dm_df:  # Check if the key already exists\n",
    "                            dm_df[pattern] = pd.concat([dm_df[pattern], pd.read_excel(filepath, sheet_name=0).drop(columns=['Unnamed: 0'])], axis=0)\n",
    "                            #display(dm_df[pattern])\n",
    "                        else:\n",
    "                            dm_df[pattern] = pd.read_excel(filepath, sheet_name=0).drop(columns=['Unnamed: 0']).copy(deep=True)\n",
    "                        # dm_df[pattern].append(pd.read_excel(filepath, sheet_name=0).drop(columns=['Unnamed: 0']).copy(deep=True))\n",
    "                        break  # Stop checking patterns for this file\n",
    "    return dm_df \n",
    "\n",
    "def read_and_get_filtered_dataframes(root_path, patterns=[r\"cifar10\"]):\n",
    "    dm_df = helper_find_files_and_read_dataframe(root_path, patterns = patterns)\n",
    "    # Apply filter to all dataframes\n",
    "    for dm, df in dm_df.items():\n",
    "        if df is None:\n",
    "            continue\n",
    "        df1 = copy.copy(df) # Shallow copy to new dataframe\n",
    "        df1['calib_conf'] = df1['calib_conf'].fillna(\"None\")\n",
    "        df1['calib_conf'] = df1['calib_conf'].astype(str)\n",
    "\n",
    "        # Sort by col: Coverage-Mean in descending order, and then by col: calib_conf in ascending order\n",
    "        df2 = df1.sort_values([\"Coverage-Mean\", \"calib_conf\"], ascending = [False, True]).copy(deep=True)\n",
    "        # Retain the first row for each unique value in col: calib_conf\n",
    "        df3 = df2.drop_duplicates(subset=['calib_conf', 'training_conf'], keep='first').copy(deep=True)\n",
    "        dm_df[dm] = df3\n",
    "    return dm_df \n",
    "\n",
    "dm_df = read_and_get_filtered_dataframes(\n",
    "    root_path = \"../../../outputs/final_results/final_results_to_tex_table\", \n",
    "    patterns = dm_identifier.keys())\n",
    "\n",
    "display(dm_df['cifar10'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "cms_ = OrderedDict({'None': '-',\n",
    "                    'auto_label_opt_v0': 'Ours' ,\n",
    "                    'temp_scaling': 'TS',\n",
    "                    'dirichlet': 'Dirichlet',\n",
    "                    'scaling_binning': 'SB',\n",
    "                    'histogram_binning_top_label': 'Top-HB'})\n",
    "ttms_ = OrderedDict({'std_cross_entropy': 'Vanilla',\n",
    "                     'crl': 'CRL', \n",
    "                     'fmfp': 'FMFP', \n",
    "                     'squentropy': 'Squentropy'})\n",
    "visited = []\n",
    "body_txt= \"\"\n",
    "bs = \"\\\\\"\n",
    "num_dp = 2\n",
    "global_font_size = (8,11)\n",
    "std_font_size = (6, 11)\n",
    "pm_factor = 0.6 \n",
    "\n",
    "for tm, cm in itertools.product(ttms_.keys(), cms_.keys()):\n",
    "    # Add post-hoc method name \n",
    "    # cross_prod_i = cm.replace(\"_\", \"\\\\_\")\n",
    "    cross_prod_i = cms_[cm]\n",
    "    if tm not in visited:\n",
    "        #temp_tm = tm.replace(\"_\", \"\\\\_\")\n",
    "        temp_tm = ttms_[tm]\n",
    "        cross_prod_i = rf\"\"\"\\multirow{{6}}{{*}}{{{temp_tm}}}                     & \"\"\" + cross_prod_i \n",
    "        visited.append(tm)\n",
    "    else:\n",
    "        cross_prod_i = \" \".join([\"                                 & \", cross_prod_i]) \n",
    "\n",
    "    # For each dataset, add columns for Error and Coverage \n",
    "    for dm, df in dm_df.items():\n",
    "        # print(dm)\n",
    "        # display(df)\n",
    "        if df is not None:\n",
    "            mask1 = (df[\"calib_conf\"] == f\"{cm}\") & (df[\"training_conf\"] == f\"{tm}\")\n",
    "            al_mean = df[mask1]['Auto-Labeling-Err-Mean'].values[0] if not df[mask1]['Auto-Labeling-Err-Mean'].empty else -1 \n",
    "            al_std = df[mask1]['Auto-Labeling-Err-Std'].values[0] if not df[mask1]['Auto-Labeling-Err-Std'].empty else -1 \n",
    "            c_mean = df[mask1]['Coverage-Mean'].values[0] if not df[mask1]['Coverage-Mean'].empty else -1 \n",
    "            c_std= df[mask1]['Coverage-Std'].values[0] if not df[mask1]['Coverage-Std'].empty else -1 \n",
    "\n",
    "            # Determine if al_mean and c_mean should be bold\n",
    "            mask2 = (df[\"training_conf\"] == f\"{tm}\")\n",
    "            if al_mean == df[mask2]['Auto-Labeling-Err-Mean'].min():\n",
    "                al_mean_str_format, al_std_str_format = (rf\"\\textbf\" + \"{\" + rf\"{al_mean:.{num_dp}f}\" + \"}\", rf\"\\textbf\" + \"{\" + rf\"{al_std:.{num_dp}f}\" + \"}\")\n",
    "                al_plus_minus = f\"\\\\scalebox{{{pm_factor}}}{{\\\\ensuremath{{\\\\bm{{\\\\pm}}}}}}\"\n",
    "            else:\n",
    "                al_mean_str_format, al_std_str_format = (rf\"{al_mean:.{num_dp}f}\", rf\"{al_std:.{num_dp}f}\")\n",
    "                al_plus_minus = f\"\\\\scalebox{{{pm_factor}}}{{\\\\ensuremath{{{bs}pm}}}}\"\n",
    "\n",
    "            if c_mean == df[mask2]['Coverage-Mean'].max():\n",
    "                c_mean_str_format, c_std_str_format = (rf\"\\textbf\" + \"{\" + rf\"{c_mean:.{num_dp}f}\" + \"}\",rf\"\\textbf\" + \"{\" + rf\"{c_std:.{num_dp}f}\" + \"}\")\n",
    "                c_plus_minus = f\"\\\\scalebox{{{pm_factor}}}{{\\\\ensuremath{{\\\\bm{{\\\\pm}}}}}}\"\n",
    "            else: \n",
    "                c_mean_str_format, c_std_str_format = (rf\"{c_mean:.{num_dp}f}\", rf\"{c_std:.{num_dp}f}\")\n",
    "                c_plus_minus = f\"\\\\scalebox{{{pm_factor}}}{{\\\\ensuremath{{{bs}pm}}}}\"\n",
    "\n",
    "            \n",
    "        else:\n",
    "            al_mean, al_std, c_mean, c_std = -1, -1, -1, -1 \n",
    "        open_std_font = \"{\" + f\"{bs}fontsize{{{std_font_size[0]}}}{{{std_font_size[1]}}}{bs}selectfont\"\n",
    "        closing_std_font = \"}\" \n",
    "        # plus_minus = rf\" \\scalebox{{{pm_factor}}}\" + \"{\" + \"\\ensuremath\" + \"{\"  \"${bs}pm$ \" + \"}\" + \"}\"\n",
    "        # plus_minus = f\"\\\\scalebox{{{pm_factor}}}{{\\\\ensuremath{{{bs}pm}}}}\"\n",
    "\n",
    "        # cross_prod_i = cross_prod_i + \" & \" + f\"\"\" { rf\"{al_mean:.{num_dp}f}\" + plus_minus + open_std_font + rf\"{al_std:.{num_dp}f}\" } \"\"\" + closing_std_font + \" & \" + f\"\"\" { rf\"{c_mean:.{num_dp}f}\" + plus_minus + open_std_font + rf\"{c_std:.{num_dp}f}\" } \"\"\" + closing_std_font\n",
    "        cross_prod_i = cross_prod_i + \" & \" + f\"\"\" { al_mean_str_format + al_plus_minus + open_std_font + al_std_str_format} \"\"\" + closing_std_font + \" & \" + f\"\"\" { c_mean_str_format + c_plus_minus + open_std_font + c_std_str_format} \"\"\" + closing_std_font\n",
    "\n",
    "    if cm == list(cms_.keys())[-1] and tm == list(ttms_.keys())[-1]:\n",
    "        line = rf\"\\bottomrule\"\n",
    "    elif cm == list(cms_.keys())[-1] and tm != list(ttms_.keys())[-1]:\n",
    "        line = \"\\hline\"\n",
    "    else:\n",
    "        line = \"\"\n",
    "    cross_prod_i = cross_prod_i + r\"\\\\\" + line\n",
    "    body_txt= body_txt+ cross_prod_i + \"\\n\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "\n",
    "#metrics_txt = \" & \".join( [ \"\\multicolumn{1}{c}\" + \"{\" + rf\"\\textbf\" + \"{\" + sm + \"}\" + \"}\" for sm in sub_metrics] * len(data_models))\n",
    "metrics_txt = \" & \".join( [ \"\\multicolumn{1}{c}\" + \"{\" + rf\"\\textbf\" + \"{\" + sm + \"}\" + \"}\" for sm in sub_metrics] * len(dm_identifier.keys()))\n",
    "#data_models_txt = ' & ' + ' & '.join([rf\"\\multicolumn{{{len(sub_metrics)}}}{{c}}\" + \"{\" + rf\"\\textbf\" + rf\"{{{dm_identifier[dm]}}}\" + \"}\" for dm in data_models])\n",
    "data_models_txt = ' & ' + ' & '.join([rf\"\\multicolumn{{{len(sub_metrics)}}}{{c}}\" + \"{\" + rf\"\\textbf\" + rf\"{{{dm_identifier[dm]}}}\" + \"}\" for dm in dm_identifier.keys()])\n",
    "caption = \"Example TBAL LaTeX Table\"\n",
    "\n",
    "template = rf\"\"\"\n",
    "\\begin{{table*}}[t]\n",
    "\\fontsize{{{global_font_size[0]}}}{{{global_font_size[1]}}}\\selectfont\n",
    "\\begin{{tabular}}{{llllllllll}}\n",
    "\\toprule\n",
    "\\multicolumn{{1}}{{c}}{{\\multirow{{2}}{{*}}{{\\textbf{{Train-time}}}}}} & \\multicolumn{{1}}{{c}}{{\\multirow{{2}}{{*}}{{\\textbf{{Post-hoc}}}}}} {data_models_txt} \\\\ \\cline{{3-10}}\n",
    "\\multicolumn{{1}}{{c}}{{}}                      & \\multicolumn{{1}}{{c}}{{}}  & {metrics_txt} \\\\ \\toprule \n",
    "\"\"\" + body_txt + rf\"\"\"\n",
    "\\end{{tabular}}\n",
    "\\caption{{{caption}}}\n",
    "\\end{{table*}}\"\"\"\n",
    "\n",
    "# TODO: Add new column shading color features \n",
    "\n",
    "# template = rf\"\"\"\n",
    "# \\begin{{table*}}[t]\n",
    "# \\fontsize{{{global_font_size[0]}}}{{{global_font_size[1]}}}\\selectfont\n",
    "# \\begin{{tabular}}{{lll>{{\\columncolor{{gray}}}}lllllll}}\n",
    "# \\toprule\n",
    "# \\multicolumn{{1}}{{c}}{{\\multirow{{2}}{{*}}{{\\textbf{{Train-time}}}}}} & \\multicolumn{{1}}{{c}}{{\\multirow{{2}}{{*}}{{\\textbf{{Post-hoc}}}}}} {data_models_txt} \\\\ \\cline{{3-10}}\n",
    "# \\multicolumn{{1}}{{c}}{{}}                      & \\multicolumn{{1}}{{c}}{{}}  & {metrics_txt} \\\\ \\toprule \n",
    "# \"\"\" + body_txt + rf\"\"\"\n",
    "# \\end{{tabular}}\n",
    "# \\caption{{{caption}}}\n",
    "# \\end{{table*}}\"\"\"\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "with open(\"./final_table_latex_template.txt\", \"w\") as file:\n",
    "    file.write(template)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "ml-kernel-tbal",
   "language": "python",
   "name": "ml-kernel-tbal"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
