{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "0504557f",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "from pmlb import fetch_data, regression_dataset_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "a719faec",
   "metadata": {},
   "outputs": [],
   "source": [
    "data_list = [\n",
    "    \"1027_ESL\",\n",
    "    \"1028_SWD\",\n",
    "    \"1029_LEV\",\n",
    "    \"1030_ERA\",\n",
    "    \"1089_USCrime\",\n",
    "    \"1096_FacultySalaries\",\n",
    "    \"1191_BNG_pbc\",\n",
    "    \"1193_BNG_lowbwt\",\n",
    "    \"1196_BNG_pharynx\",\n",
    "    \"1199_BNG_echoMonths\",\n",
    "    \"1201_BNG_breastTumor\",\n",
    "    \"192_vineyard\",\n",
    "    \"195_auto_price\",\n",
    "    \"197_cpu_act\",\n",
    "    \"201_pol\",\n",
    "    \"207_autoPrice\",\n",
    "    \"210_cloud\",\n",
    "    \"215_2dplanes\",\n",
    "    \"218_house_8L\",\n",
    "    \"225_puma8NH\",\n",
    "    \"227_cpu_small\",\n",
    "    \"228_elusage\",\n",
    "    \"229_pwLinear\",\n",
    "    \"230_machine_cpu\",\n",
    "    \"294_satellite_image\",\n",
    "    \"344_mv\",\n",
    "    \"4544_GeographicalOriginalofMusic\",\n",
    "    \"485_analcatdata_vehicle\",\n",
    "    \"503_wind\",\n",
    "    \"505_tecator\",\n",
    "    \"519_vinnie\",\n",
    "    \"522_pm10\",\n",
    "    \"523_analcatdata_neavote\",\n",
    "    \"527_analcatdata_election2000\",\n",
    "    \"529_pollen\",\n",
    "    \"537_houses\",\n",
    "    \"542_pollution\",\n",
    "    \"547_no2\",\n",
    "    \"556_analcatdata_apnea2\",\n",
    "    \"557_analcatdata_apnea1\",\n",
    "    \"560_bodyfat\",\n",
    "    \"561_cpu\",\n",
    "    \"562_cpu_small\",\n",
    "    \"564_fried\",\n",
    "    \"573_cpu_act\",\n",
    "    \"574_house_16H\",\n",
    "    \"579_fri_c0_250_5\",\n",
    "    \"581_fri_c3_500_25\",\n",
    "    \"582_fri_c1_500_25\",\n",
    "    \"583_fri_c1_1000_50\",\n",
    "    \"584_fri_c4_500_25\",\n",
    "    \"586_fri_c3_1000_25\",\n",
    "    \"588_fri_c4_1000_100\",\n",
    "    \"589_fri_c2_1000_25\",\n",
    "    \"590_fri_c0_1000_50\",\n",
    "    \"591_fri_c1_100_10\",\n",
    "    \"592_fri_c4_1000_25\",\n",
    "    \"593_fri_c1_1000_10\",\n",
    "    \"594_fri_c2_100_5\",\n",
    "    \"595_fri_c0_1000_10\",\n",
    "    \"596_fri_c2_250_5\",\n",
    "    \"597_fri_c2_500_5\",\n",
    "    \"598_fri_c0_1000_25\",\n",
    "    \"599_fri_c2_1000_5\",\n",
    "    \"601_fri_c1_250_5\",\n",
    "    \"602_fri_c3_250_10\",\n",
    "    \"603_fri_c0_250_50\",\n",
    "    \"604_fri_c4_500_10\",\n",
    "    \"605_fri_c2_250_25\",\n",
    "    \"606_fri_c2_1000_10\",\n",
    "    \"607_fri_c4_1000_50\",\n",
    "    \"608_fri_c3_1000_10\",\n",
    "    \"609_fri_c0_1000_5\",\n",
    "    \"611_fri_c3_100_5\",\n",
    "    \"612_fri_c1_1000_5\",\n",
    "    \"613_fri_c3_250_5\",\n",
    "    \"615_fri_c4_250_10\",\n",
    "    \"616_fri_c4_500_50\",\n",
    "    \"617_fri_c3_500_5\",\n",
    "    \"618_fri_c3_1000_50\",\n",
    "    \"620_fri_c1_1000_25\",\n",
    "    \"621_fri_c0_100_10\",\n",
    "    \"622_fri_c2_1000_50\",\n",
    "    \"623_fri_c4_1000_10\",\n",
    "    \"624_fri_c0_100_5\",\n",
    "    \"626_fri_c2_500_50\",\n",
    "    \"627_fri_c2_500_10\",\n",
    "    \"628_fri_c3_1000_5\",\n",
    "    \"631_fri_c1_500_5\",\n",
    "    \"633_fri_c0_500_25\",\n",
    "    \"634_fri_c2_100_10\",\n",
    "    \"635_fri_c0_250_10\",\n",
    "    \"637_fri_c1_500_50\",\n",
    "    \"641_fri_c1_500_10\",\n",
    "    \"643_fri_c2_500_25\",\n",
    "    \"644_fri_c4_250_25\",\n",
    "    \"645_fri_c3_500_50\",\n",
    "    \"646_fri_c3_500_10\",\n",
    "    \"647_fri_c1_250_10\",\n",
    "    \"648_fri_c1_250_50\",\n",
    "    \"649_fri_c0_500_5\",\n",
    "    \"650_fri_c0_500_50\",\n",
    "    \"651_fri_c0_100_25\",\n",
    "    \"653_fri_c0_250_25\",\n",
    "    \"654_fri_c0_500_10\",\n",
    "    \"656_fri_c1_100_5\",\n",
    "    \"657_fri_c2_250_10\",\n",
    "    \"658_fri_c3_250_25\",\n",
    "    \"659_sleuth_ex1714\",\n",
    "    \"663_rabe_266\",\n",
    "    \"665_sleuth_case2002\",\n",
    "    \"666_rmftsa_ladata\",\n",
    "    \"678_visualizing_environmental\",\n",
    "    \"687_sleuth_ex1605\",\n",
    "    \"690_visualizing_galaxy\",\n",
    "    \"695_chatfield_4\",\n",
    "    \"706_sleuth_case1202\",\n",
    "    \"712_chscase_geyser1\",\n",
    "    \"banana\",\n",
    "    \"titanic\"\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "50e4d6b3",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import json\n",
    "import pandas as pd\n",
    "\n",
    "def load_jsons_to_long_df(directory):\n",
    "    records = []\n",
    "\n",
    "    for filename in os.listdir(directory):\n",
    "        if filename.endswith('.json'):\n",
    "            filepath = os.path.join(directory, filename)\n",
    "            with open(filepath, 'r') as f:\n",
    "                data = json.load(f)\n",
    "\n",
    "            for model, model_data in data.items():\n",
    "                tau = model_data.get('tau')\n",
    "                for metric, metric_data in model_data.items():\n",
    "                    if metric == 'tau':\n",
    "                        continue\n",
    "                    for dataset, values in metric_data.items():\n",
    "                        for run_idx, value in enumerate(values):\n",
    "                            records.append({\n",
    "                                'filename': filename,\n",
    "                                'model': model,\n",
    "                                'tau': tau,\n",
    "                                'metric': metric,\n",
    "                                'dataset': dataset,\n",
    "                                'run': run_idx,\n",
    "                                'value': value\n",
    "                            })\n",
    "\n",
    "    df = pd.DataFrame.from_records(records)\n",
    "    return df\n",
    "\n",
    "# Example usage:\n",
    "directory = 'results/'  # Replace with your actual directory path\n",
    "df_long = load_jsons_to_long_df(directory)\n",
    "# TODO: change to results_timing and re-run analyses\n",
    "df_long_timing = load_jsons_to_long_df('results/')\n",
    "# df_long_timing = load_jsons_to_long_df('results_timing/')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "48225fbe",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>filename</th>\n",
       "      <th>model</th>\n",
       "      <th>tau</th>\n",
       "      <th>metric</th>\n",
       "      <th>dataset</th>\n",
       "      <th>run</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>0</td>\n",
       "      <td>0.013109</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>1</td>\n",
       "      <td>0.012958</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>2</td>\n",
       "      <td>0.018811</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>3</td>\n",
       "      <td>0.013429</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>4</td>\n",
       "      <td>0.023515</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21615</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>0</td>\n",
       "      <td>0.137714</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21616</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>1</td>\n",
       "      <td>0.255429</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21617</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>2</td>\n",
       "      <td>0.504053</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21618</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>3</td>\n",
       "      <td>0.935991</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21619</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>4</td>\n",
       "      <td>1.187911</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>21620 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                               filename           model  tau    metric  \\\n",
       "0       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "1       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "2       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "3       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "4       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "...                                 ...             ...  ...       ...   \n",
       "21615  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21616  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21617  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21618  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21619  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "\n",
       "                 dataset  run     value  \n",
       "0       631_fri_c1_500_5    0  0.013109  \n",
       "1       631_fri_c1_500_5    1  0.012958  \n",
       "2       631_fri_c1_500_5    2  0.018811  \n",
       "3       631_fri_c1_500_5    3  0.013429  \n",
       "4       631_fri_c1_500_5    4  0.023515  \n",
       "...                  ...  ...       ...  \n",
       "21615  603_fri_c0_250_50    0  0.137714  \n",
       "21616  603_fri_c0_250_50    1  0.255429  \n",
       "21617  603_fri_c0_250_50    2  0.504053  \n",
       "21618  603_fri_c0_250_50    3  0.935991  \n",
       "21619  603_fri_c0_250_50    4  1.187911  \n",
       "\n",
       "[21620 rows x 7 columns]"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_long_timing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "b55b1ed6",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_long['dataset_id'] = df_long['dataset'].str.split('_').str[0]\n",
    "df_long_timing['dataset_id'] = df_long_timing['dataset'].str.split('_').str[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "14bbed27",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model    metric     value\n",
      "1   0.5    DecisionTree  coverage  0.087895\n",
      "5   0.5        LightGBM  coverage  0.064430\n",
      "10  0.5  LinearQuantile  coverage  0.065201\n",
      "15  0.5             SQR  coverage  0.082943\n",
      "20  0.9    DecisionTree  coverage  0.066118\n",
      "24  0.9        LightGBM  coverage  0.039402\n",
      "29  0.9  LinearQuantile  coverage  0.286541\n",
      "34  0.9             SQR  coverage  0.049139\n",
      "    tau           model    metric     value\n",
      "1   0.5    DecisionTree  coverage  0.103398\n",
      "5   0.5        LightGBM  coverage  0.069138\n",
      "10  0.5  LinearQuantile  coverage  0.080679\n",
      "15  0.5             SQR  coverage  0.091786\n",
      "20  0.9    DecisionTree  coverage  0.057689\n",
      "24  0.9        LightGBM  coverage  0.037856\n",
      "29  0.9  LinearQuantile  coverage  0.207353\n",
      "34  0.9             SQR  coverage  0.061283\n"
     ]
    }
   ],
   "source": [
    "avg_df = df_long.groupby(['tau', 'model', 'metric'])['value'].mean().reset_index()\n",
    "avg_df_timing = df_long_timing.groupby(['tau', 'model', 'metric'])['value'].mean().reset_index()\n",
    "stdev_df = df_long.groupby(['tau', 'model', 'metric'])['value'].std().reset_index()\n",
    "print(avg_df[avg_df.metric == 'coverage'])\n",
    "print(stdev_df[stdev_df.metric == 'coverage'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "6f37d133",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model  metric     value\n",
      "2   0.5    DecisionTree  losses  0.038794\n",
      "6   0.5        LightGBM  losses  0.042355\n",
      "11  0.5  LinearQuantile  losses  0.058600\n",
      "16  0.5             SQR  losses  0.030043\n",
      "21  0.9    DecisionTree  losses  0.019703\n",
      "25  0.9        LightGBM  losses  0.024632\n",
      "30  0.9  LinearQuantile  losses  0.053503\n",
      "35  0.9             SQR  losses  0.014851\n",
      "    tau           model  metric     value\n",
      "2   0.5    DecisionTree  losses  0.017538\n",
      "6   0.5        LightGBM  losses  0.022201\n",
      "11  0.5  LinearQuantile  losses  0.030018\n",
      "16  0.5             SQR  losses  0.021463\n",
      "21  0.9    DecisionTree  losses  0.009538\n",
      "25  0.9        LightGBM  losses  0.012220\n",
      "30  0.9  LinearQuantile  losses  0.044210\n",
      "35  0.9             SQR  losses  0.013473\n"
     ]
    }
   ],
   "source": [
    "avg_df = df_long.groupby(['tau', 'model', 'metric'])['value'].mean().reset_index()\n",
    "stdev_df = df_long.groupby(['tau', 'model', 'metric'])['value'].std().reset_index()\n",
    "print(avg_df[avg_df.metric == 'losses'])\n",
    "print(stdev_df[stdev_df.metric == 'losses'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "559a029f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model    metric     value\n",
      "1   0.5    DecisionTree  coverage  0.087895\n",
      "5   0.5        LightGBM  coverage  0.064430\n",
      "10  0.5  LinearQuantile  coverage  0.065201\n",
      "15  0.5             SQR  coverage  0.082943\n",
      "20  0.9    DecisionTree  coverage  0.066118\n",
      "24  0.9        LightGBM  coverage  0.039402\n",
      "29  0.9  LinearQuantile  coverage  0.286541\n",
      "34  0.9             SQR  coverage  0.049139\n"
     ]
    }
   ],
   "source": [
    "print(avg_df[avg_df.metric == 'coverage'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "ec4e6551",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model    metric        value\n",
      "3   0.5    DecisionTree  time_all     0.315487\n",
      "7   0.5        LightGBM  time_all     5.008716\n",
      "12  0.5  LinearQuantile  time_all    10.309813\n",
      "17  0.5             SQR  time_all  3299.124167\n",
      "22  0.9    DecisionTree  time_all     0.347780\n",
      "26  0.9        LightGBM  time_all     9.811793\n",
      "31  0.9  LinearQuantile  time_all    11.506157\n",
      "36  0.9             SQR  time_all  1906.944231\n"
     ]
    }
   ],
   "source": [
    "print(avg_df[avg_df.metric == 'time_all'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "771d7160",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model    metric        value\n",
      "4   0.5    DecisionTree  time_fit     0.030239\n",
      "8   0.5        LightGBM  time_fit     0.580455\n",
      "13  0.5  LinearQuantile  time_fit     0.638731\n",
      "18  0.5             SQR  time_fit  3299.124167\n",
      "23  0.9    DecisionTree  time_fit     0.027797\n",
      "27  0.9        LightGBM  time_fit     2.427570\n",
      "32  0.9  LinearQuantile  time_fit     0.579071\n",
      "37  0.9             SQR  time_fit  1906.944231\n"
     ]
    }
   ],
   "source": [
    "print(avg_df[avg_df.metric == 'time_fit'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "db28968c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model    metric       value\n",
      "3   0.5    DecisionTree  time_all    0.062334\n",
      "7   0.5        LightGBM  time_all    0.211015\n",
      "12  0.5  LinearQuantile  time_all    0.461874\n",
      "17  0.5             SQR  time_all  487.705531\n",
      "22  0.9    DecisionTree  time_all    0.067351\n",
      "26  0.9        LightGBM  time_all    0.173563\n",
      "31  0.9  LinearQuantile  time_all    0.529954\n",
      "36  0.9             SQR  time_all  471.634248\n"
     ]
    }
   ],
   "source": [
    "median_df = df_long.groupby(['tau', 'model', 'metric'])['value'].median().reset_index()\n",
    "stdev_df = df_long.groupby(['tau', 'model', 'metric'])['value'].std().reset_index()\n",
    "print(median_df[median_df.metric == 'time_all'])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "869d1839",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "    tau           model    metric       value\n",
      "4   0.5    DecisionTree  time_fit    0.008075\n",
      "8   0.5        LightGBM  time_fit    0.049278\n",
      "13  0.5  LinearQuantile  time_fit    0.041045\n",
      "18  0.5             SQR  time_fit  487.705531\n",
      "23  0.9    DecisionTree  time_fit    0.005041\n",
      "27  0.9        LightGBM  time_fit    0.036523\n",
      "32  0.9  LinearQuantile  time_fit    0.047319\n",
      "37  0.9             SQR  time_fit  471.634248\n"
     ]
    }
   ],
   "source": [
    "print(median_df[median_df.metric == 'time_fit'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "6007f7d9",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>filename</th>\n",
       "      <th>model</th>\n",
       "      <th>tau</th>\n",
       "      <th>metric</th>\n",
       "      <th>dataset</th>\n",
       "      <th>run</th>\n",
       "      <th>value</th>\n",
       "      <th>dataset_id</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>0</td>\n",
       "      <td>0.013109</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>1</td>\n",
       "      <td>0.012958</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>2</td>\n",
       "      <td>0.018811</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>3</td>\n",
       "      <td>0.013429</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>4</td>\n",
       "      <td>0.023515</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21615</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>0</td>\n",
       "      <td>0.137714</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21616</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>1</td>\n",
       "      <td>0.255429</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21617</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>2</td>\n",
       "      <td>0.504053</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21618</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>3</td>\n",
       "      <td>0.935991</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21619</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>4</td>\n",
       "      <td>1.187911</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>21620 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                               filename           model  tau    metric  \\\n",
       "0       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "1       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "2       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "3       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "4       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "...                                 ...             ...  ...       ...   \n",
       "21615  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21616  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21617  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21618  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21619  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "\n",
       "                 dataset  run     value dataset_id  \n",
       "0       631_fri_c1_500_5    0  0.013109        631  \n",
       "1       631_fri_c1_500_5    1  0.012958        631  \n",
       "2       631_fri_c1_500_5    2  0.018811        631  \n",
       "3       631_fri_c1_500_5    3  0.013429        631  \n",
       "4       631_fri_c1_500_5    4  0.023515        631  \n",
       "...                  ...  ...       ...        ...  \n",
       "21615  603_fri_c0_250_50    0  0.137714        603  \n",
       "21616  603_fri_c0_250_50    1  0.255429        603  \n",
       "21617  603_fri_c0_250_50    2  0.504053        603  \n",
       "21618  603_fri_c0_250_50    3  0.935991        603  \n",
       "21619  603_fri_c0_250_50    4  1.187911        603  \n",
       "\n",
       "[21620 rows x 8 columns]"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_long"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "83dba10e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataset_id</th>\n",
       "      <th>tau</th>\n",
       "      <th>model</th>\n",
       "      <th>metric</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>complexity</td>\n",
       "      <td>127.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>complexity</td>\n",
       "      <td>34.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>SQR</td>\n",
       "      <td>complexity</td>\n",
       "      <td>8.600000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>coverage</td>\n",
       "      <td>0.276667</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>coverage</td>\n",
       "      <td>0.053293</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  dataset_id  tau           model      metric       value\n",
       "0       1027  0.5    DecisionTree  complexity  127.000000\n",
       "5       1027  0.5  LinearQuantile  complexity   34.000000\n",
       "8       1027  0.5             SQR  complexity    8.600000\n",
       "1       1027  0.5    DecisionTree    coverage    0.276667\n",
       "3       1027  0.5        LightGBM    coverage    0.053293"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "avg_df = df_long[~df_long.metric.isin(['time_fit', 'time_all'])].groupby(['dataset_id', 'tau', 'model', 'metric'])['value'].mean().reset_index().sort_values(['tau', 'dataset_id','metric'])\n",
    "avg_df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "3048dfda",
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_df_timing = df_long_timing[df_long_timing.metric == 'time_all'].groupby(['dataset_id', 'tau', 'model', 'metric'])['value'].mean().reset_index()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "8611630e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>filename</th>\n",
       "      <th>model</th>\n",
       "      <th>tau</th>\n",
       "      <th>metric</th>\n",
       "      <th>dataset</th>\n",
       "      <th>run</th>\n",
       "      <th>value</th>\n",
       "      <th>dataset_id</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>0</td>\n",
       "      <td>0.013109</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>1</td>\n",
       "      <td>0.012958</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>2</td>\n",
       "      <td>0.018811</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>3</td>\n",
       "      <td>0.013429</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>results50_631_fri_c1_500_5.json</td>\n",
       "      <td>SQR</td>\n",
       "      <td>0.5</td>\n",
       "      <td>losses</td>\n",
       "      <td>631_fri_c1_500_5</td>\n",
       "      <td>4</td>\n",
       "      <td>0.023515</td>\n",
       "      <td>631</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21615</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>0</td>\n",
       "      <td>0.137714</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21616</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>1</td>\n",
       "      <td>0.255429</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21617</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>2</td>\n",
       "      <td>0.504053</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21618</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>3</td>\n",
       "      <td>0.935991</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21619</th>\n",
       "      <td>results90_603_fri_c0_250_50.json</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>0.9</td>\n",
       "      <td>time_fit</td>\n",
       "      <td>603_fri_c0_250_50</td>\n",
       "      <td>4</td>\n",
       "      <td>1.187911</td>\n",
       "      <td>603</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>21620 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                               filename           model  tau    metric  \\\n",
       "0       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "1       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "2       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "3       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "4       results50_631_fri_c1_500_5.json             SQR  0.5    losses   \n",
       "...                                 ...             ...  ...       ...   \n",
       "21615  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21616  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21617  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21618  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "21619  results90_603_fri_c0_250_50.json  LinearQuantile  0.9  time_fit   \n",
       "\n",
       "                 dataset  run     value dataset_id  \n",
       "0       631_fri_c1_500_5    0  0.013109        631  \n",
       "1       631_fri_c1_500_5    1  0.012958        631  \n",
       "2       631_fri_c1_500_5    2  0.018811        631  \n",
       "3       631_fri_c1_500_5    3  0.013429        631  \n",
       "4       631_fri_c1_500_5    4  0.023515        631  \n",
       "...                  ...  ...       ...        ...  \n",
       "21615  603_fri_c0_250_50    0  0.137714        603  \n",
       "21616  603_fri_c0_250_50    1  0.255429        603  \n",
       "21617  603_fri_c0_250_50    2  0.504053        603  \n",
       "21618  603_fri_c0_250_50    3  0.935991        603  \n",
       "21619  603_fri_c0_250_50    4  1.187911        603  \n",
       "\n",
       "[21620 rows x 8 columns]"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_long_timing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "fa7a1f12",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1027_ESL\n",
      "1028_SWD\n",
      "1029_LEV\n",
      "1030_ERA\n",
      "1089_USCrime\n",
      "1096_FacultySalaries\n",
      "1191_BNG_pbc\n",
      "1193_BNG_lowbwt\n",
      "1196_BNG_pharynx\n",
      "1199_BNG_echoMonths\n",
      "1201_BNG_breastTumor\n",
      "192_vineyard\n",
      "195_auto_price\n",
      "Error for 195_auto_price\n",
      "197_cpu_act\n",
      "201_pol\n",
      "207_autoPrice\n",
      "Error for 207_autoPrice\n",
      "210_cloud\n",
      "215_2dplanes\n",
      "218_house_8L\n",
      "225_puma8NH\n",
      "227_cpu_small\n",
      "228_elusage\n",
      "229_pwLinear\n",
      "230_machine_cpu\n",
      "294_satellite_image\n",
      "344_mv\n",
      "4544_GeographicalOriginalofMusic\n",
      "485_analcatdata_vehicle\n",
      "503_wind\n",
      "505_tecator\n",
      "519_vinnie\n",
      "522_pm10\n",
      "523_analcatdata_neavote\n",
      "527_analcatdata_election2000\n",
      "529_pollen\n",
      "537_houses\n",
      "542_pollution\n",
      "547_no2\n",
      "556_analcatdata_apnea2\n",
      "557_analcatdata_apnea1\n",
      "560_bodyfat\n",
      "561_cpu\n",
      "562_cpu_small\n",
      "564_fried\n",
      "573_cpu_act\n",
      "574_house_16H\n",
      "579_fri_c0_250_5\n",
      "581_fri_c3_500_25\n",
      "582_fri_c1_500_25\n",
      "583_fri_c1_1000_50\n",
      "584_fri_c4_500_25\n",
      "586_fri_c3_1000_25\n",
      "588_fri_c4_1000_100\n",
      "589_fri_c2_1000_25\n",
      "590_fri_c0_1000_50\n",
      "591_fri_c1_100_10\n",
      "592_fri_c4_1000_25\n",
      "593_fri_c1_1000_10\n",
      "594_fri_c2_100_5\n",
      "595_fri_c0_1000_10\n",
      "596_fri_c2_250_5\n",
      "597_fri_c2_500_5\n",
      "598_fri_c0_1000_25\n",
      "599_fri_c2_1000_5\n",
      "601_fri_c1_250_5\n",
      "602_fri_c3_250_10\n",
      "603_fri_c0_250_50\n",
      "604_fri_c4_500_10\n",
      "605_fri_c2_250_25\n",
      "606_fri_c2_1000_10\n",
      "607_fri_c4_1000_50\n",
      "608_fri_c3_1000_10\n",
      "609_fri_c0_1000_5\n",
      "611_fri_c3_100_5\n",
      "612_fri_c1_1000_5\n",
      "613_fri_c3_250_5\n",
      "615_fri_c4_250_10\n",
      "616_fri_c4_500_50\n",
      "617_fri_c3_500_5\n",
      "618_fri_c3_1000_50\n",
      "620_fri_c1_1000_25\n",
      "621_fri_c0_100_10\n",
      "622_fri_c2_1000_50\n",
      "623_fri_c4_1000_10\n",
      "624_fri_c0_100_5\n",
      "626_fri_c2_500_50\n",
      "627_fri_c2_500_10\n",
      "628_fri_c3_1000_5\n",
      "631_fri_c1_500_5\n",
      "633_fri_c0_500_25\n",
      "634_fri_c2_100_10\n",
      "635_fri_c0_250_10\n",
      "637_fri_c1_500_50\n",
      "641_fri_c1_500_10\n",
      "643_fri_c2_500_25\n",
      "644_fri_c4_250_25\n",
      "645_fri_c3_500_50\n",
      "646_fri_c3_500_10\n",
      "647_fri_c1_250_10\n",
      "648_fri_c1_250_50\n",
      "649_fri_c0_500_5\n",
      "650_fri_c0_500_50\n",
      "651_fri_c0_100_25\n",
      "653_fri_c0_250_25\n",
      "654_fri_c0_500_10\n",
      "656_fri_c1_100_5\n",
      "657_fri_c2_250_10\n",
      "658_fri_c3_250_25\n",
      "659_sleuth_ex1714\n",
      "663_rabe_266\n",
      "665_sleuth_case2002\n",
      "666_rmftsa_ladata\n",
      "678_visualizing_environmental\n",
      "687_sleuth_ex1605\n",
      "690_visualizing_galaxy\n",
      "695_chatfield_4\n",
      "706_sleuth_case1202\n",
      "712_chscase_geyser1\n",
      "banana\n",
      "titanic\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>$d$</th>\n",
       "      <th>$n$</th>\n",
       "      <th>ids</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>4</td>\n",
       "      <td>488</td>\n",
       "      <td>1027</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>10</td>\n",
       "      <td>1000</td>\n",
       "      <td>1028</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>4</td>\n",
       "      <td>1000</td>\n",
       "      <td>1029</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>1000</td>\n",
       "      <td>1030</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>13</td>\n",
       "      <td>47</td>\n",
       "      <td>1089</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   $d$   $n$   ids\n",
       "0    4   488  1027\n",
       "1   10  1000  1028\n",
       "2    4  1000  1029\n",
       "3    4  1000  1030\n",
       "4   13    47  1089"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Create dictionary with dataset lengths\n",
    "dataset_info = {\n",
    "    'ids': [],\n",
    "    '$n$': [],\n",
    "    '$d$': [],\n",
    "}\n",
    "for dataset_name in regression_dataset_names:\n",
    "    if dataset_name in data_list:\n",
    "        try:\n",
    "            print(dataset_name)\n",
    "            data = fetch_data(dataset_name, return_X_y=True)\n",
    "            X, y = data\n",
    "            id = dataset_name.split('_')[0]\n",
    "            dataset_info['ids'].append(id)\n",
    "            dataset_info['$n$'].append(X.shape[0])\n",
    "            dataset_info['$d$'].append(X.shape[1])\n",
    "        except:\n",
    "            print(f\"Error for {dataset_name}\")\n",
    "\n",
    "df_info = pd.DataFrame.from_records(dataset_info)\n",
    "\n",
    "df_info.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "a3cd8639",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataset_id</th>\n",
       "      <th>tau</th>\n",
       "      <th>model</th>\n",
       "      <th>metric</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>complexity</td>\n",
       "      <td>127.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>complexity</td>\n",
       "      <td>34.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>SQR</td>\n",
       "      <td>complexity</td>\n",
       "      <td>8.600000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>coverage</td>\n",
       "      <td>0.276667</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>coverage</td>\n",
       "      <td>0.053293</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2506</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>SQR</td>\n",
       "      <td>coverage</td>\n",
       "      <td>0.098571</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2499</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>losses</td>\n",
       "      <td>0.070219</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2501</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>losses</td>\n",
       "      <td>0.067556</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2504</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>losses</td>\n",
       "      <td>0.065554</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2507</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>SQR</td>\n",
       "      <td>losses</td>\n",
       "      <td>0.065696</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2508 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     dataset_id  tau           model      metric       value\n",
       "0          1027  0.5    DecisionTree  complexity  127.000000\n",
       "5          1027  0.5  LinearQuantile  complexity   34.000000\n",
       "8          1027  0.5             SQR  complexity    8.600000\n",
       "1          1027  0.5    DecisionTree    coverage    0.276667\n",
       "3          1027  0.5        LightGBM    coverage    0.053293\n",
       "...         ...  ...             ...         ...         ...\n",
       "2506    titanic  0.9             SQR    coverage    0.098571\n",
       "2499    titanic  0.9    DecisionTree      losses    0.070219\n",
       "2501    titanic  0.9        LightGBM      losses    0.067556\n",
       "2504    titanic  0.9  LinearQuantile      losses    0.065554\n",
       "2507    titanic  0.9             SQR      losses    0.065696\n",
       "\n",
       "[2508 rows x 5 columns]"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "avg_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "dbac4d2f",
   "metadata": {},
   "outputs": [],
   "source": [
    "index_cols = ['dataset_id', 'tau',]\n",
    "pivot_cols = ['metric', 'model']\n",
    "avg_with_stats = pd.merge(avg_df, df_info, left_on=['dataset_id'], right_on=['ids'], how='inner')\n",
    "avg_with_stats_timing = pd.merge(avg_df_timing, df_info, left_on=['dataset_id'], right_on=['ids'], how='inner')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "e4660a6e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataset_id</th>\n",
       "      <th>tau</th>\n",
       "      <th>model</th>\n",
       "      <th>metric</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.048754</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.178550</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>time_all</td>\n",
       "      <td>1.546284</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>SQR</td>\n",
       "      <td>time_all</td>\n",
       "      <td>417.371688</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.9</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.048657</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>903</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.5</td>\n",
       "      <td>SQR</td>\n",
       "      <td>time_all</td>\n",
       "      <td>859.301180</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>904</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.133787</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>905</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.109384</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>906</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>time_all</td>\n",
       "      <td>1.012228</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>907</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>SQR</td>\n",
       "      <td>time_all</td>\n",
       "      <td>903.903540</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>908 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    dataset_id  tau           model    metric       value\n",
       "0         1027  0.5    DecisionTree  time_all    0.048754\n",
       "1         1027  0.5        LightGBM  time_all    0.178550\n",
       "2         1027  0.5  LinearQuantile  time_all    1.546284\n",
       "3         1027  0.5             SQR  time_all  417.371688\n",
       "4         1027  0.9    DecisionTree  time_all    0.048657\n",
       "..         ...  ...             ...       ...         ...\n",
       "903    titanic  0.5             SQR  time_all  859.301180\n",
       "904    titanic  0.9    DecisionTree  time_all    0.133787\n",
       "905    titanic  0.9        LightGBM  time_all    0.109384\n",
       "906    titanic  0.9  LinearQuantile  time_all    1.012228\n",
       "907    titanic  0.9             SQR  time_all  903.903540\n",
       "\n",
       "[908 rows x 5 columns]"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "avg_df_timing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "38180c24",
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_all_stats = pd.concat([avg_with_stats, avg_with_stats_timing]).sort_values(['tau', 'dataset_id','metric'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "13f65f41",
   "metadata": {},
   "outputs": [],
   "source": [
    "pivot = avg_all_stats.pivot(index=['tau','dataset_id', '$n$', '$d$'], columns=['metric', 'model',], values=['value'])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "8c05e201",
   "metadata": {},
   "outputs": [],
   "source": [
    "pivot = avg_all_stats.pivot(index=['tau','dataset_id', '$n$', '$d$'], columns=['metric', 'model',], values=['value'])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cd89e81c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataset_id</th>\n",
       "      <th>tau</th>\n",
       "      <th>model</th>\n",
       "      <th>metric</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.048754</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.178550</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>time_all</td>\n",
       "      <td>1.546284</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.5</td>\n",
       "      <td>SQR</td>\n",
       "      <td>time_all</td>\n",
       "      <td>417.371688</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1027</td>\n",
       "      <td>0.9</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.048657</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>903</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.5</td>\n",
       "      <td>SQR</td>\n",
       "      <td>time_all</td>\n",
       "      <td>859.301180</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>904</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>DecisionTree</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.133787</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>905</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>LightGBM</td>\n",
       "      <td>time_all</td>\n",
       "      <td>0.109384</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>906</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>LinearQuantile</td>\n",
       "      <td>time_all</td>\n",
       "      <td>1.012228</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>907</th>\n",
       "      <td>titanic</td>\n",
       "      <td>0.9</td>\n",
       "      <td>SQR</td>\n",
       "      <td>time_all</td>\n",
       "      <td>903.903540</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>908 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    dataset_id  tau           model    metric       value\n",
       "0         1027  0.5    DecisionTree  time_all    0.048754\n",
       "1         1027  0.5        LightGBM  time_all    0.178550\n",
       "2         1027  0.5  LinearQuantile  time_all    1.546284\n",
       "3         1027  0.5             SQR  time_all  417.371688\n",
       "4         1027  0.9    DecisionTree  time_all    0.048657\n",
       "..         ...  ...             ...       ...         ...\n",
       "903    titanic  0.5             SQR  time_all  859.301180\n",
       "904    titanic  0.9    DecisionTree  time_all    0.133787\n",
       "905    titanic  0.9        LightGBM  time_all    0.109384\n",
       "906    titanic  0.9  LinearQuantile  time_all    1.012228\n",
       "907    titanic  0.9             SQR  time_all  903.903540\n",
       "\n",
       "[908 rows x 5 columns]"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "2c22ebb9",
   "metadata": {},
   "outputs": [],
   "source": [
    "pivot.to_latex(buf='/tmp/table.tex',float_format=\"%.2f\",longtable=True,multicolumn=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "7814aadc",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr:last-of-type th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"15\" halign=\"left\">value</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>metric</th>\n",
       "      <th colspan=\"3\" halign=\"left\">complexity</th>\n",
       "      <th colspan=\"4\" halign=\"left\">coverage</th>\n",
       "      <th colspan=\"4\" halign=\"left\">losses</th>\n",
       "      <th colspan=\"4\" halign=\"left\">time_all</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>model</th>\n",
       "      <th>DecisionTree</th>\n",
       "      <th>LinearQuantile</th>\n",
       "      <th>SQR</th>\n",
       "      <th>DecisionTree</th>\n",
       "      <th>LightGBM</th>\n",
       "      <th>LinearQuantile</th>\n",
       "      <th>SQR</th>\n",
       "      <th>DecisionTree</th>\n",
       "      <th>LightGBM</th>\n",
       "      <th>LinearQuantile</th>\n",
       "      <th>SQR</th>\n",
       "      <th>DecisionTree</th>\n",
       "      <th>LightGBM</th>\n",
       "      <th>LinearQuantile</th>\n",
       "      <th>SQR</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>tau</th>\n",
       "      <th>dataset_id</th>\n",
       "      <th>$n$</th>\n",
       "      <th>$d$</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">0.5</th>\n",
       "      <th>1027</th>\n",
       "      <th>488</th>\n",
       "      <th>4</th>\n",
       "      <td>127.0</td>\n",
       "      <td>34.0</td>\n",
       "      <td>8.6</td>\n",
       "      <td>0.276667</td>\n",
       "      <td>0.053293</td>\n",
       "      <td>0.018430</td>\n",
       "      <td>0.303261</td>\n",
       "      <td>0.030537</td>\n",
       "      <td>0.038563</td>\n",
       "      <td>0.027710</td>\n",
       "      <td>0.036618</td>\n",
       "      <td>0.048754</td>\n",
       "      <td>0.178550</td>\n",
       "      <td>1.546284</td>\n",
       "      <td>417.371688</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1028</th>\n",
       "      <th>1000</th>\n",
       "      <th>10</th>\n",
       "      <td>101.4</td>\n",
       "      <td>31.0</td>\n",
       "      <td>3.0</td>\n",
       "      <td>0.274000</td>\n",
       "      <td>0.067000</td>\n",
       "      <td>0.027000</td>\n",
       "      <td>0.207000</td>\n",
       "      <td>0.072500</td>\n",
       "      <td>0.081235</td>\n",
       "      <td>0.081431</td>\n",
       "      <td>0.083167</td>\n",
       "      <td>0.064790</td>\n",
       "      <td>0.300018</td>\n",
       "      <td>1.813944</td>\n",
       "      <td>607.824603</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1029</th>\n",
       "      <th>1000</th>\n",
       "      <th>4</th>\n",
       "      <td>165.8</td>\n",
       "      <td>20.0</td>\n",
       "      <td>3.0</td>\n",
       "      <td>0.301000</td>\n",
       "      <td>0.052000</td>\n",
       "      <td>0.031000</td>\n",
       "      <td>0.230000</td>\n",
       "      <td>0.049812</td>\n",
       "      <td>0.066075</td>\n",
       "      <td>0.060289</td>\n",
       "      <td>0.078875</td>\n",
       "      <td>0.079527</td>\n",
       "      <td>0.345356</td>\n",
       "      <td>1.236205</td>\n",
       "      <td>644.401032</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1030</th>\n",
       "      <th>1000</th>\n",
       "      <th>4</th>\n",
       "      <td>42.2</td>\n",
       "      <td>4.0</td>\n",
       "      <td>3.2</td>\n",
       "      <td>0.107000</td>\n",
       "      <td>0.059000</td>\n",
       "      <td>0.052000</td>\n",
       "      <td>0.047000</td>\n",
       "      <td>0.075812</td>\n",
       "      <td>0.077701</td>\n",
       "      <td>0.079377</td>\n",
       "      <td>0.084572</td>\n",
       "      <td>0.037574</td>\n",
       "      <td>0.279260</td>\n",
       "      <td>0.088389</td>\n",
       "      <td>630.110298</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1089</th>\n",
       "      <th>47</th>\n",
       "      <th>13</th>\n",
       "      <td>7.0</td>\n",
       "      <td>14.0</td>\n",
       "      <td>11.2</td>\n",
       "      <td>0.155556</td>\n",
       "      <td>0.095556</td>\n",
       "      <td>0.144444</td>\n",
       "      <td>0.140000</td>\n",
       "      <td>0.063244</td>\n",
       "      <td>0.117830</td>\n",
       "      <td>0.056674</td>\n",
       "      <td>0.058604</td>\n",
       "      <td>0.015354</td>\n",
       "      <td>0.020814</td>\n",
       "      <td>1.940744</td>\n",
       "      <td>278.114929</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <th>...</th>\n",
       "      <th>...</th>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">0.9</th>\n",
       "      <th>695</th>\n",
       "      <th>235</th>\n",
       "      <th>12</th>\n",
       "      <td>14.2</td>\n",
       "      <td>12.0</td>\n",
       "      <td>2.0</td>\n",
       "      <td>0.067660</td>\n",
       "      <td>0.034468</td>\n",
       "      <td>0.052340</td>\n",
       "      <td>0.041277</td>\n",
       "      <td>0.014847</td>\n",
       "      <td>0.018622</td>\n",
       "      <td>0.013100</td>\n",
       "      <td>0.013515</td>\n",
       "      <td>0.032173</td>\n",
       "      <td>0.106865</td>\n",
       "      <td>0.190090</td>\n",
       "      <td>359.216813</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>706</th>\n",
       "      <th>93</th>\n",
       "      <th>6</th>\n",
       "      <td>5.4</td>\n",
       "      <td>11.0</td>\n",
       "      <td>8.6</td>\n",
       "      <td>0.044327</td>\n",
       "      <td>0.016023</td>\n",
       "      <td>0.089708</td>\n",
       "      <td>0.086433</td>\n",
       "      <td>0.026652</td>\n",
       "      <td>0.032751</td>\n",
       "      <td>0.024138</td>\n",
       "      <td>0.020376</td>\n",
       "      <td>0.020010</td>\n",
       "      <td>0.066106</td>\n",
       "      <td>0.847623</td>\n",
       "      <td>300.672056</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>712</th>\n",
       "      <th>222</th>\n",
       "      <th>2</th>\n",
       "      <td>24.6</td>\n",
       "      <td>2.0</td>\n",
       "      <td>3.2</td>\n",
       "      <td>0.039798</td>\n",
       "      <td>0.079798</td>\n",
       "      <td>0.106869</td>\n",
       "      <td>0.052626</td>\n",
       "      <td>0.021857</td>\n",
       "      <td>0.023223</td>\n",
       "      <td>0.059274</td>\n",
       "      <td>0.023099</td>\n",
       "      <td>0.025992</td>\n",
       "      <td>0.117049</td>\n",
       "      <td>0.064099</td>\n",
       "      <td>376.738821</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>banana</th>\n",
       "      <th>5300</th>\n",
       "      <th>2</th>\n",
       "      <td>146.6</td>\n",
       "      <td>2.0</td>\n",
       "      <td>12.6</td>\n",
       "      <td>0.087547</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>0.635283</td>\n",
       "      <td>0.346415</td>\n",
       "      <td>0.027938</td>\n",
       "      <td>0.055170</td>\n",
       "      <td>0.403472</td>\n",
       "      <td>0.036330</td>\n",
       "      <td>0.201511</td>\n",
       "      <td>0.131165</td>\n",
       "      <td>0.045424</td>\n",
       "      <td>2140.997827</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>titanic</th>\n",
       "      <th>2099</th>\n",
       "      <th>8</th>\n",
       "      <td>87.4</td>\n",
       "      <td>31.0</td>\n",
       "      <td>3.2</td>\n",
       "      <td>0.069031</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>0.119637</td>\n",
       "      <td>0.098571</td>\n",
       "      <td>0.070219</td>\n",
       "      <td>0.067556</td>\n",
       "      <td>0.065554</td>\n",
       "      <td>0.065696</td>\n",
       "      <td>0.133787</td>\n",
       "      <td>0.109384</td>\n",
       "      <td>1.012228</td>\n",
       "      <td>903.903540</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>228 rows × 15 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                               value                                    \\\n",
       "metric                    complexity                          coverage   \n",
       "model                   DecisionTree LinearQuantile   SQR DecisionTree   \n",
       "tau dataset_id $n$  $d$                                                  \n",
       "0.5 1027       488  4          127.0           34.0   8.6     0.276667   \n",
       "    1028       1000 10         101.4           31.0   3.0     0.274000   \n",
       "    1029       1000 4          165.8           20.0   3.0     0.301000   \n",
       "    1030       1000 4           42.2            4.0   3.2     0.107000   \n",
       "    1089       47   13           7.0           14.0  11.2     0.155556   \n",
       "...                              ...            ...   ...          ...   \n",
       "0.9 695        235  12          14.2           12.0   2.0     0.067660   \n",
       "    706        93   6            5.4           11.0   8.6     0.044327   \n",
       "    712        222  2           24.6            2.0   3.2     0.039798   \n",
       "    banana     5300 2          146.6            2.0  12.6     0.087547   \n",
       "    titanic    2099 8           87.4           31.0   3.2     0.069031   \n",
       "\n",
       "                                                                         \\\n",
       "metric                                                           losses   \n",
       "model                    LightGBM LinearQuantile       SQR DecisionTree   \n",
       "tau dataset_id $n$  $d$                                                   \n",
       "0.5 1027       488  4    0.053293       0.018430  0.303261     0.030537   \n",
       "    1028       1000 10   0.067000       0.027000  0.207000     0.072500   \n",
       "    1029       1000 4    0.052000       0.031000  0.230000     0.049812   \n",
       "    1030       1000 4    0.059000       0.052000  0.047000     0.075812   \n",
       "    1089       47   13   0.095556       0.144444  0.140000     0.063244   \n",
       "...                           ...            ...       ...          ...   \n",
       "0.9 695        235  12   0.034468       0.052340  0.041277     0.014847   \n",
       "    706        93   6    0.016023       0.089708  0.086433     0.026652   \n",
       "    712        222  2    0.079798       0.106869  0.052626     0.021857   \n",
       "    banana     5300 2    0.100000       0.635283  0.346415     0.027938   \n",
       "    titanic    2099 8    0.100000       0.119637  0.098571     0.070219   \n",
       "\n",
       "                                                                         \\\n",
       "metric                                                         time_all   \n",
       "model                    LightGBM LinearQuantile       SQR DecisionTree   \n",
       "tau dataset_id $n$  $d$                                                   \n",
       "0.5 1027       488  4    0.038563       0.027710  0.036618     0.048754   \n",
       "    1028       1000 10   0.081235       0.081431  0.083167     0.064790   \n",
       "    1029       1000 4    0.066075       0.060289  0.078875     0.079527   \n",
       "    1030       1000 4    0.077701       0.079377  0.084572     0.037574   \n",
       "    1089       47   13   0.117830       0.056674  0.058604     0.015354   \n",
       "...                           ...            ...       ...          ...   \n",
       "0.9 695        235  12   0.018622       0.013100  0.013515     0.032173   \n",
       "    706        93   6    0.032751       0.024138  0.020376     0.020010   \n",
       "    712        222  2    0.023223       0.059274  0.023099     0.025992   \n",
       "    banana     5300 2    0.055170       0.403472  0.036330     0.201511   \n",
       "    titanic    2099 8    0.067556       0.065554  0.065696     0.133787   \n",
       "\n",
       "                                                               \n",
       "metric                                                         \n",
       "model                    LightGBM LinearQuantile          SQR  \n",
       "tau dataset_id $n$  $d$                                        \n",
       "0.5 1027       488  4    0.178550       1.546284   417.371688  \n",
       "    1028       1000 10   0.300018       1.813944   607.824603  \n",
       "    1029       1000 4    0.345356       1.236205   644.401032  \n",
       "    1030       1000 4    0.279260       0.088389   630.110298  \n",
       "    1089       47   13   0.020814       1.940744   278.114929  \n",
       "...                           ...            ...          ...  \n",
       "0.9 695        235  12   0.106865       0.190090   359.216813  \n",
       "    706        93   6    0.066106       0.847623   300.672056  \n",
       "    712        222  2    0.117049       0.064099   376.738821  \n",
       "    banana     5300 2    0.131165       0.045424  2140.997827  \n",
       "    titanic    2099 8    0.109384       1.012228   903.903540  \n",
       "\n",
       "[228 rows x 15 columns]"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pivot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cb2fe9e2",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "sqr-noversion",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
