{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "from pkg.utils.analyze import summarize_outputs_in_df\n",
    "\n",
    "sweep_path = \"/home/knowledge-tracing/ktst/sweeps/ablation_assist2009\"\n",
    "train_path = \"/home/knowledge-tracing/ktst/ablation_attention_assist2009/train\"\n",
    "test_path = \"/home/knowledge-tracing/ktst/ablation_attention_assist2009/eval\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>val_time</th>\n",
       "      <th>val_metric</th>\n",
       "      <th>val_auc</th>\n",
       "      <th>val_accuracy</th>\n",
       "      <th>val_epoch_mean_loss</th>\n",
       "      <th>epoch</th>\n",
       "      <th>iteration</th>\n",
       "      <th>trainable_params</th>\n",
       "      <th>best_iteration</th>\n",
       "      <th>...</th>\n",
       "      <th>data.batch_size_val</th>\n",
       "      <th>data.val_fold_idx</th>\n",
       "      <th>optimizer._target_</th>\n",
       "      <th>optimizer._recursive_</th>\n",
       "      <th>optimizer.lr</th>\n",
       "      <th>optimizer.weight_decay</th>\n",
       "      <th>trainer.log_after_num_iterations</th>\n",
       "      <th>optimizer.theta_lr</th>\n",
       "      <th>run_dir</th>\n",
       "      <th>outputs_dir</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>0.980277</td>\n",
       "      <td>0.777942</td>\n",
       "      <td>0.777942</td>\n",
       "      <td>0.743306</td>\n",
       "      <td>0.524501</td>\n",
       "      <td>25</td>\n",
       "      <td>600</td>\n",
       "      <td>10306145</td>\n",
       "      <td>600</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>1</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>0.672466</td>\n",
       "      <td>0.777685</td>\n",
       "      <td>0.777685</td>\n",
       "      <td>0.744762</td>\n",
       "      <td>0.531637</td>\n",
       "      <td>67</td>\n",
       "      <td>1608</td>\n",
       "      <td>3876921</td>\n",
       "      <td>1608</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>1</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00005</td>\n",
       "      <td>0.00005</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0</td>\n",
       "      <td>0.811379</td>\n",
       "      <td>0.778648</td>\n",
       "      <td>0.778648</td>\n",
       "      <td>0.745080</td>\n",
       "      <td>0.530989</td>\n",
       "      <td>26</td>\n",
       "      <td>624</td>\n",
       "      <td>9783101</td>\n",
       "      <td>624</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>1</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0</td>\n",
       "      <td>1.079332</td>\n",
       "      <td>0.778887</td>\n",
       "      <td>0.778887</td>\n",
       "      <td>0.744489</td>\n",
       "      <td>0.527889</td>\n",
       "      <td>28</td>\n",
       "      <td>672</td>\n",
       "      <td>10207713</td>\n",
       "      <td>672</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>1</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00005</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0</td>\n",
       "      <td>1.016201</td>\n",
       "      <td>0.780656</td>\n",
       "      <td>0.780656</td>\n",
       "      <td>0.745831</td>\n",
       "      <td>0.523404</td>\n",
       "      <td>53</td>\n",
       "      <td>1272</td>\n",
       "      <td>10476229</td>\n",
       "      <td>1272</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>1</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00005</td>\n",
       "      <td>0.00005</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3495</th>\n",
       "      <td>0</td>\n",
       "      <td>0.300478</td>\n",
       "      <td>0.760989</td>\n",
       "      <td>0.760989</td>\n",
       "      <td>0.725194</td>\n",
       "      <td>0.544136</td>\n",
       "      <td>76</td>\n",
       "      <td>1824</td>\n",
       "      <td>3413121</td>\n",
       "      <td>1824</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>4</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3496</th>\n",
       "      <td>0</td>\n",
       "      <td>0.354748</td>\n",
       "      <td>0.761144</td>\n",
       "      <td>0.761144</td>\n",
       "      <td>0.725617</td>\n",
       "      <td>0.546149</td>\n",
       "      <td>154</td>\n",
       "      <td>3696</td>\n",
       "      <td>3810561</td>\n",
       "      <td>3696</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>4</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00005</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3497</th>\n",
       "      <td>0</td>\n",
       "      <td>0.296390</td>\n",
       "      <td>0.764528</td>\n",
       "      <td>0.764528</td>\n",
       "      <td>0.727643</td>\n",
       "      <td>0.544219</td>\n",
       "      <td>85</td>\n",
       "      <td>2040</td>\n",
       "      <td>3413121</td>\n",
       "      <td>2040</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>4</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3498</th>\n",
       "      <td>0</td>\n",
       "      <td>0.295143</td>\n",
       "      <td>0.761737</td>\n",
       "      <td>0.761737</td>\n",
       "      <td>0.728378</td>\n",
       "      <td>0.546384</td>\n",
       "      <td>83</td>\n",
       "      <td>1992</td>\n",
       "      <td>3413121</td>\n",
       "      <td>1992</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>4</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3499</th>\n",
       "      <td>0</td>\n",
       "      <td>0.289474</td>\n",
       "      <td>0.763670</td>\n",
       "      <td>0.763670</td>\n",
       "      <td>0.726908</td>\n",
       "      <td>0.545659</td>\n",
       "      <td>82</td>\n",
       "      <td>1968</td>\n",
       "      <td>3413121</td>\n",
       "      <td>1968</td>\n",
       "      <td>...</td>\n",
       "      <td>64</td>\n",
       "      <td>4</td>\n",
       "      <td>torch.optim.Adam</td>\n",
       "      <td>False</td>\n",
       "      <td>0.00010</td>\n",
       "      <td>0.00001</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "      <td>/home/knowledge-tracing/ktst/sweeps/ablation_a...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>3500 rows × 54 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      index  val_time  val_metric   val_auc  val_accuracy  \\\n",
       "0         0  0.980277    0.777942  0.777942      0.743306   \n",
       "1         0  0.672466    0.777685  0.777685      0.744762   \n",
       "2         0  0.811379    0.778648  0.778648      0.745080   \n",
       "3         0  1.079332    0.778887  0.778887      0.744489   \n",
       "4         0  1.016201    0.780656  0.780656      0.745831   \n",
       "...     ...       ...         ...       ...           ...   \n",
       "3495      0  0.300478    0.760989  0.760989      0.725194   \n",
       "3496      0  0.354748    0.761144  0.761144      0.725617   \n",
       "3497      0  0.296390    0.764528  0.764528      0.727643   \n",
       "3498      0  0.295143    0.761737  0.761737      0.728378   \n",
       "3499      0  0.289474    0.763670  0.763670      0.726908   \n",
       "\n",
       "      val_epoch_mean_loss  epoch  iteration  trainable_params  best_iteration  \\\n",
       "0                0.524501     25        600          10306145             600   \n",
       "1                0.531637     67       1608           3876921            1608   \n",
       "2                0.530989     26        624           9783101             624   \n",
       "3                0.527889     28        672          10207713             672   \n",
       "4                0.523404     53       1272          10476229            1272   \n",
       "...                   ...    ...        ...               ...             ...   \n",
       "3495             0.544136     76       1824           3413121            1824   \n",
       "3496             0.546149    154       3696           3810561            3696   \n",
       "3497             0.544219     85       2040           3413121            2040   \n",
       "3498             0.546384     83       1992           3413121            1992   \n",
       "3499             0.545659     82       1968           3413121            1968   \n",
       "\n",
       "      ...  data.batch_size_val data.val_fold_idx  optimizer._target_  \\\n",
       "0     ...                   64                 1    torch.optim.Adam   \n",
       "1     ...                   64                 1    torch.optim.Adam   \n",
       "2     ...                   64                 1    torch.optim.Adam   \n",
       "3     ...                   64                 1    torch.optim.Adam   \n",
       "4     ...                   64                 1    torch.optim.Adam   \n",
       "...   ...                  ...               ...                 ...   \n",
       "3495  ...                   64                 4    torch.optim.Adam   \n",
       "3496  ...                   64                 4    torch.optim.Adam   \n",
       "3497  ...                   64                 4    torch.optim.Adam   \n",
       "3498  ...                   64                 4    torch.optim.Adam   \n",
       "3499  ...                   64                 4    torch.optim.Adam   \n",
       "\n",
       "      optimizer._recursive_ optimizer.lr optimizer.weight_decay  \\\n",
       "0                     False      0.00010                0.00001   \n",
       "1                     False      0.00005                0.00005   \n",
       "2                     False      0.00010                0.00001   \n",
       "3                     False      0.00010                0.00005   \n",
       "4                     False      0.00005                0.00005   \n",
       "...                     ...          ...                    ...   \n",
       "3495                  False      0.00010                0.00001   \n",
       "3496                  False      0.00005                0.00001   \n",
       "3497                  False      0.00010                0.00001   \n",
       "3498                  False      0.00010                0.00001   \n",
       "3499                  False      0.00010                0.00001   \n",
       "\n",
       "      trainer.log_after_num_iterations  optimizer.theta_lr  \\\n",
       "0                                  NaN                 NaN   \n",
       "1                                  NaN                 NaN   \n",
       "2                                  NaN                 NaN   \n",
       "3                                  NaN                 NaN   \n",
       "4                                  NaN                 NaN   \n",
       "...                                ...                 ...   \n",
       "3495                               NaN                 NaN   \n",
       "3496                               NaN                 NaN   \n",
       "3497                               NaN                 NaN   \n",
       "3498                               NaN                 NaN   \n",
       "3499                               NaN                 NaN   \n",
       "\n",
       "                                                run_dir  \\\n",
       "0     /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "1     /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "2     /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "3     /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "4     /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "...                                                 ...   \n",
       "3495  /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "3496  /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "3497  /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "3498  /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "3499  /home/knowledge-tracing/ktst/sweeps/ablation_a...   \n",
       "\n",
       "                                            outputs_dir  \n",
       "0     /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "1     /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "2     /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "3     /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "4     /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "...                                                 ...  \n",
       "3495  /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "3496  /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "3497  /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "3498  /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "3499  /home/knowledge-tracing/ktst/sweeps/ablation_a...  \n",
       "\n",
       "[3500 rows x 54 columns]"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# sweep\n",
    "df_sweep = summarize_outputs_in_df(outputs_dir=sweep_path)\n",
    "df_sweep"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr:last-of-type th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">val_auc</th>\n",
       "      <th colspan=\"4\" halign=\"left\">val_accuracy</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>max</th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "      <th>max</th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>model.attn_variant</th>\n",
       "      <th>model.use_decoder_only</th>\n",
       "      <th>data.val_fold_idx</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">akt_monotonic</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.792770</td>\n",
       "      <td>0.790117</td>\n",
       "      <td>0.001017</td>\n",
       "      <td>100</td>\n",
       "      <td>0.754023</td>\n",
       "      <td>0.749878</td>\n",
       "      <td>0.001297</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.782070</td>\n",
       "      <td>0.779797</td>\n",
       "      <td>0.000958</td>\n",
       "      <td>100</td>\n",
       "      <td>0.749312</td>\n",
       "      <td>0.745202</td>\n",
       "      <td>0.001267</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.790613</td>\n",
       "      <td>0.788539</td>\n",
       "      <td>0.001086</td>\n",
       "      <td>100</td>\n",
       "      <td>0.757135</td>\n",
       "      <td>0.754504</td>\n",
       "      <td>0.001171</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.784018</td>\n",
       "      <td>0.782174</td>\n",
       "      <td>0.001119</td>\n",
       "      <td>100</td>\n",
       "      <td>0.749845</td>\n",
       "      <td>0.747789</td>\n",
       "      <td>0.001161</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.789966</td>\n",
       "      <td>0.787996</td>\n",
       "      <td>0.000871</td>\n",
       "      <td>100</td>\n",
       "      <td>0.746099</td>\n",
       "      <td>0.744027</td>\n",
       "      <td>0.000947</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">alibi_monotonic</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.790275</td>\n",
       "      <td>0.787933</td>\n",
       "      <td>0.001720</td>\n",
       "      <td>100</td>\n",
       "      <td>0.752402</td>\n",
       "      <td>0.748486</td>\n",
       "      <td>0.001660</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.780984</td>\n",
       "      <td>0.777518</td>\n",
       "      <td>0.001630</td>\n",
       "      <td>100</td>\n",
       "      <td>0.746718</td>\n",
       "      <td>0.743654</td>\n",
       "      <td>0.001751</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.790900</td>\n",
       "      <td>0.787472</td>\n",
       "      <td>0.001754</td>\n",
       "      <td>100</td>\n",
       "      <td>0.757271</td>\n",
       "      <td>0.753833</td>\n",
       "      <td>0.001483</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.781265</td>\n",
       "      <td>0.778538</td>\n",
       "      <td>0.001615</td>\n",
       "      <td>100</td>\n",
       "      <td>0.749183</td>\n",
       "      <td>0.746051</td>\n",
       "      <td>0.001777</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.788992</td>\n",
       "      <td>0.785833</td>\n",
       "      <td>0.001827</td>\n",
       "      <td>100</td>\n",
       "      <td>0.746455</td>\n",
       "      <td>0.743032</td>\n",
       "      <td>0.001912</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">alibi_monotonic_q_k</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.793804</td>\n",
       "      <td>0.791580</td>\n",
       "      <td>0.001095</td>\n",
       "      <td>100</td>\n",
       "      <td>0.754162</td>\n",
       "      <td>0.751329</td>\n",
       "      <td>0.001288</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.783544</td>\n",
       "      <td>0.781715</td>\n",
       "      <td>0.000805</td>\n",
       "      <td>100</td>\n",
       "      <td>0.747924</td>\n",
       "      <td>0.745775</td>\n",
       "      <td>0.001477</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.793501</td>\n",
       "      <td>0.790693</td>\n",
       "      <td>0.001403</td>\n",
       "      <td>100</td>\n",
       "      <td>0.758570</td>\n",
       "      <td>0.755721</td>\n",
       "      <td>0.001545</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.785331</td>\n",
       "      <td>0.783608</td>\n",
       "      <td>0.000870</td>\n",
       "      <td>100</td>\n",
       "      <td>0.752271</td>\n",
       "      <td>0.748832</td>\n",
       "      <td>0.001313</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.791253</td>\n",
       "      <td>0.789156</td>\n",
       "      <td>0.000898</td>\n",
       "      <td>100</td>\n",
       "      <td>0.748570</td>\n",
       "      <td>0.745418</td>\n",
       "      <td>0.001366</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">learnable_alibi_monotonic</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.793072</td>\n",
       "      <td>0.789914</td>\n",
       "      <td>0.002052</td>\n",
       "      <td>100</td>\n",
       "      <td>0.752981</td>\n",
       "      <td>0.750036</td>\n",
       "      <td>0.001750</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.781978</td>\n",
       "      <td>0.778830</td>\n",
       "      <td>0.001899</td>\n",
       "      <td>100</td>\n",
       "      <td>0.747173</td>\n",
       "      <td>0.744396</td>\n",
       "      <td>0.001807</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.791497</td>\n",
       "      <td>0.788075</td>\n",
       "      <td>0.002009</td>\n",
       "      <td>100</td>\n",
       "      <td>0.757886</td>\n",
       "      <td>0.754175</td>\n",
       "      <td>0.001788</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.783647</td>\n",
       "      <td>0.780537</td>\n",
       "      <td>0.002142</td>\n",
       "      <td>100</td>\n",
       "      <td>0.750867</td>\n",
       "      <td>0.747231</td>\n",
       "      <td>0.001625</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.789349</td>\n",
       "      <td>0.786730</td>\n",
       "      <td>0.001716</td>\n",
       "      <td>100</td>\n",
       "      <td>0.746544</td>\n",
       "      <td>0.743723</td>\n",
       "      <td>0.001382</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"10\" valign=\"top\">learnable_alibi_monotonic_q_k</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.794550</td>\n",
       "      <td>0.792333</td>\n",
       "      <td>0.000984</td>\n",
       "      <td>100</td>\n",
       "      <td>0.754717</td>\n",
       "      <td>0.751714</td>\n",
       "      <td>0.001281</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.784062</td>\n",
       "      <td>0.782028</td>\n",
       "      <td>0.000892</td>\n",
       "      <td>100</td>\n",
       "      <td>0.748493</td>\n",
       "      <td>0.745896</td>\n",
       "      <td>0.001204</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.793899</td>\n",
       "      <td>0.791236</td>\n",
       "      <td>0.001375</td>\n",
       "      <td>100</td>\n",
       "      <td>0.759002</td>\n",
       "      <td>0.756131</td>\n",
       "      <td>0.001650</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.785811</td>\n",
       "      <td>0.783962</td>\n",
       "      <td>0.000970</td>\n",
       "      <td>100</td>\n",
       "      <td>0.752031</td>\n",
       "      <td>0.748938</td>\n",
       "      <td>0.001357</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.791716</td>\n",
       "      <td>0.789841</td>\n",
       "      <td>0.001024</td>\n",
       "      <td>100</td>\n",
       "      <td>0.748147</td>\n",
       "      <td>0.746092</td>\n",
       "      <td>0.001334</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">True</th>\n",
       "      <th>0</th>\n",
       "      <td>0.793369</td>\n",
       "      <td>0.791436</td>\n",
       "      <td>0.001234</td>\n",
       "      <td>100</td>\n",
       "      <td>0.754254</td>\n",
       "      <td>0.751224</td>\n",
       "      <td>0.001250</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.783265</td>\n",
       "      <td>0.780874</td>\n",
       "      <td>0.001052</td>\n",
       "      <td>100</td>\n",
       "      <td>0.747947</td>\n",
       "      <td>0.744995</td>\n",
       "      <td>0.001480</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.792105</td>\n",
       "      <td>0.789777</td>\n",
       "      <td>0.001353</td>\n",
       "      <td>100</td>\n",
       "      <td>0.757886</td>\n",
       "      <td>0.755161</td>\n",
       "      <td>0.001465</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.784848</td>\n",
       "      <td>0.783095</td>\n",
       "      <td>0.001371</td>\n",
       "      <td>100</td>\n",
       "      <td>0.751128</td>\n",
       "      <td>0.748107</td>\n",
       "      <td>0.001619</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.790955</td>\n",
       "      <td>0.789014</td>\n",
       "      <td>0.001059</td>\n",
       "      <td>100</td>\n",
       "      <td>0.748147</td>\n",
       "      <td>0.745352</td>\n",
       "      <td>0.001453</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">standard</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.770023</td>\n",
       "      <td>0.762052</td>\n",
       "      <td>0.006831</td>\n",
       "      <td>100</td>\n",
       "      <td>0.738325</td>\n",
       "      <td>0.733258</td>\n",
       "      <td>0.003269</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.761767</td>\n",
       "      <td>0.754138</td>\n",
       "      <td>0.006675</td>\n",
       "      <td>100</td>\n",
       "      <td>0.733932</td>\n",
       "      <td>0.728144</td>\n",
       "      <td>0.003245</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.773836</td>\n",
       "      <td>0.765367</td>\n",
       "      <td>0.006770</td>\n",
       "      <td>100</td>\n",
       "      <td>0.744676</td>\n",
       "      <td>0.739512</td>\n",
       "      <td>0.002738</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.765727</td>\n",
       "      <td>0.757583</td>\n",
       "      <td>0.005812</td>\n",
       "      <td>100</td>\n",
       "      <td>0.738954</td>\n",
       "      <td>0.733983</td>\n",
       "      <td>0.002844</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.766297</td>\n",
       "      <td>0.759343</td>\n",
       "      <td>0.005689</td>\n",
       "      <td>100</td>\n",
       "      <td>0.731027</td>\n",
       "      <td>0.725883</td>\n",
       "      <td>0.002904</td>\n",
       "      <td>100</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                                         val_auc  \\\n",
       "                                                                             max   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.792770   \n",
       "                                                     1                  0.782070   \n",
       "                                                     2                  0.790613   \n",
       "                                                     3                  0.784018   \n",
       "                                                     4                  0.789966   \n",
       "alibi_monotonic               False                  0                  0.790275   \n",
       "                                                     1                  0.780984   \n",
       "                                                     2                  0.790900   \n",
       "                                                     3                  0.781265   \n",
       "                                                     4                  0.788992   \n",
       "alibi_monotonic_q_k           False                  0                  0.793804   \n",
       "                                                     1                  0.783544   \n",
       "                                                     2                  0.793501   \n",
       "                                                     3                  0.785331   \n",
       "                                                     4                  0.791253   \n",
       "learnable_alibi_monotonic     False                  0                  0.793072   \n",
       "                                                     1                  0.781978   \n",
       "                                                     2                  0.791497   \n",
       "                                                     3                  0.783647   \n",
       "                                                     4                  0.789349   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.794550   \n",
       "                                                     1                  0.784062   \n",
       "                                                     2                  0.793899   \n",
       "                                                     3                  0.785811   \n",
       "                                                     4                  0.791716   \n",
       "                              True                   0                  0.793369   \n",
       "                                                     1                  0.783265   \n",
       "                                                     2                  0.792105   \n",
       "                                                     3                  0.784848   \n",
       "                                                     4                  0.790955   \n",
       "standard                      False                  0                  0.770023   \n",
       "                                                     1                  0.761767   \n",
       "                                                     2                  0.773836   \n",
       "                                                     3                  0.765727   \n",
       "                                                     4                  0.766297   \n",
       "\n",
       "                                                                                  \\\n",
       "                                                                            mean   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.790117   \n",
       "                                                     1                  0.779797   \n",
       "                                                     2                  0.788539   \n",
       "                                                     3                  0.782174   \n",
       "                                                     4                  0.787996   \n",
       "alibi_monotonic               False                  0                  0.787933   \n",
       "                                                     1                  0.777518   \n",
       "                                                     2                  0.787472   \n",
       "                                                     3                  0.778538   \n",
       "                                                     4                  0.785833   \n",
       "alibi_monotonic_q_k           False                  0                  0.791580   \n",
       "                                                     1                  0.781715   \n",
       "                                                     2                  0.790693   \n",
       "                                                     3                  0.783608   \n",
       "                                                     4                  0.789156   \n",
       "learnable_alibi_monotonic     False                  0                  0.789914   \n",
       "                                                     1                  0.778830   \n",
       "                                                     2                  0.788075   \n",
       "                                                     3                  0.780537   \n",
       "                                                     4                  0.786730   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.792333   \n",
       "                                                     1                  0.782028   \n",
       "                                                     2                  0.791236   \n",
       "                                                     3                  0.783962   \n",
       "                                                     4                  0.789841   \n",
       "                              True                   0                  0.791436   \n",
       "                                                     1                  0.780874   \n",
       "                                                     2                  0.789777   \n",
       "                                                     3                  0.783095   \n",
       "                                                     4                  0.789014   \n",
       "standard                      False                  0                  0.762052   \n",
       "                                                     1                  0.754138   \n",
       "                                                     2                  0.765367   \n",
       "                                                     3                  0.757583   \n",
       "                                                     4                  0.759343   \n",
       "\n",
       "                                                                                  \\\n",
       "                                                                             std   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.001017   \n",
       "                                                     1                  0.000958   \n",
       "                                                     2                  0.001086   \n",
       "                                                     3                  0.001119   \n",
       "                                                     4                  0.000871   \n",
       "alibi_monotonic               False                  0                  0.001720   \n",
       "                                                     1                  0.001630   \n",
       "                                                     2                  0.001754   \n",
       "                                                     3                  0.001615   \n",
       "                                                     4                  0.001827   \n",
       "alibi_monotonic_q_k           False                  0                  0.001095   \n",
       "                                                     1                  0.000805   \n",
       "                                                     2                  0.001403   \n",
       "                                                     3                  0.000870   \n",
       "                                                     4                  0.000898   \n",
       "learnable_alibi_monotonic     False                  0                  0.002052   \n",
       "                                                     1                  0.001899   \n",
       "                                                     2                  0.002009   \n",
       "                                                     3                  0.002142   \n",
       "                                                     4                  0.001716   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.000984   \n",
       "                                                     1                  0.000892   \n",
       "                                                     2                  0.001375   \n",
       "                                                     3                  0.000970   \n",
       "                                                     4                  0.001024   \n",
       "                              True                   0                  0.001234   \n",
       "                                                     1                  0.001052   \n",
       "                                                     2                  0.001353   \n",
       "                                                     3                  0.001371   \n",
       "                                                     4                  0.001059   \n",
       "standard                      False                  0                  0.006831   \n",
       "                                                     1                  0.006675   \n",
       "                                                     2                  0.006770   \n",
       "                                                     3                  0.005812   \n",
       "                                                     4                  0.005689   \n",
       "\n",
       "                                                                              \\\n",
       "                                                                       count   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx         \n",
       "akt_monotonic                 False                  0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "alibi_monotonic               False                  0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "alibi_monotonic_q_k           False                  0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "learnable_alibi_monotonic     False                  0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "learnable_alibi_monotonic_q_k False                  0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "                              True                   0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "standard                      False                  0                   100   \n",
       "                                                     1                   100   \n",
       "                                                     2                   100   \n",
       "                                                     3                   100   \n",
       "                                                     4                   100   \n",
       "\n",
       "                                                                       val_accuracy  \\\n",
       "                                                                                max   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx                \n",
       "akt_monotonic                 False                  0                     0.754023   \n",
       "                                                     1                     0.749312   \n",
       "                                                     2                     0.757135   \n",
       "                                                     3                     0.749845   \n",
       "                                                     4                     0.746099   \n",
       "alibi_monotonic               False                  0                     0.752402   \n",
       "                                                     1                     0.746718   \n",
       "                                                     2                     0.757271   \n",
       "                                                     3                     0.749183   \n",
       "                                                     4                     0.746455   \n",
       "alibi_monotonic_q_k           False                  0                     0.754162   \n",
       "                                                     1                     0.747924   \n",
       "                                                     2                     0.758570   \n",
       "                                                     3                     0.752271   \n",
       "                                                     4                     0.748570   \n",
       "learnable_alibi_monotonic     False                  0                     0.752981   \n",
       "                                                     1                     0.747173   \n",
       "                                                     2                     0.757886   \n",
       "                                                     3                     0.750867   \n",
       "                                                     4                     0.746544   \n",
       "learnable_alibi_monotonic_q_k False                  0                     0.754717   \n",
       "                                                     1                     0.748493   \n",
       "                                                     2                     0.759002   \n",
       "                                                     3                     0.752031   \n",
       "                                                     4                     0.748147   \n",
       "                              True                   0                     0.754254   \n",
       "                                                     1                     0.747947   \n",
       "                                                     2                     0.757886   \n",
       "                                                     3                     0.751128   \n",
       "                                                     4                     0.748147   \n",
       "standard                      False                  0                     0.738325   \n",
       "                                                     1                     0.733932   \n",
       "                                                     2                     0.744676   \n",
       "                                                     3                     0.738954   \n",
       "                                                     4                     0.731027   \n",
       "\n",
       "                                                                                  \\\n",
       "                                                                            mean   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.749878   \n",
       "                                                     1                  0.745202   \n",
       "                                                     2                  0.754504   \n",
       "                                                     3                  0.747789   \n",
       "                                                     4                  0.744027   \n",
       "alibi_monotonic               False                  0                  0.748486   \n",
       "                                                     1                  0.743654   \n",
       "                                                     2                  0.753833   \n",
       "                                                     3                  0.746051   \n",
       "                                                     4                  0.743032   \n",
       "alibi_monotonic_q_k           False                  0                  0.751329   \n",
       "                                                     1                  0.745775   \n",
       "                                                     2                  0.755721   \n",
       "                                                     3                  0.748832   \n",
       "                                                     4                  0.745418   \n",
       "learnable_alibi_monotonic     False                  0                  0.750036   \n",
       "                                                     1                  0.744396   \n",
       "                                                     2                  0.754175   \n",
       "                                                     3                  0.747231   \n",
       "                                                     4                  0.743723   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.751714   \n",
       "                                                     1                  0.745896   \n",
       "                                                     2                  0.756131   \n",
       "                                                     3                  0.748938   \n",
       "                                                     4                  0.746092   \n",
       "                              True                   0                  0.751224   \n",
       "                                                     1                  0.744995   \n",
       "                                                     2                  0.755161   \n",
       "                                                     3                  0.748107   \n",
       "                                                     4                  0.745352   \n",
       "standard                      False                  0                  0.733258   \n",
       "                                                     1                  0.728144   \n",
       "                                                     2                  0.739512   \n",
       "                                                     3                  0.733983   \n",
       "                                                     4                  0.725883   \n",
       "\n",
       "                                                                                  \\\n",
       "                                                                             std   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.001297   \n",
       "                                                     1                  0.001267   \n",
       "                                                     2                  0.001171   \n",
       "                                                     3                  0.001161   \n",
       "                                                     4                  0.000947   \n",
       "alibi_monotonic               False                  0                  0.001660   \n",
       "                                                     1                  0.001751   \n",
       "                                                     2                  0.001483   \n",
       "                                                     3                  0.001777   \n",
       "                                                     4                  0.001912   \n",
       "alibi_monotonic_q_k           False                  0                  0.001288   \n",
       "                                                     1                  0.001477   \n",
       "                                                     2                  0.001545   \n",
       "                                                     3                  0.001313   \n",
       "                                                     4                  0.001366   \n",
       "learnable_alibi_monotonic     False                  0                  0.001750   \n",
       "                                                     1                  0.001807   \n",
       "                                                     2                  0.001788   \n",
       "                                                     3                  0.001625   \n",
       "                                                     4                  0.001382   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.001281   \n",
       "                                                     1                  0.001204   \n",
       "                                                     2                  0.001650   \n",
       "                                                     3                  0.001357   \n",
       "                                                     4                  0.001334   \n",
       "                              True                   0                  0.001250   \n",
       "                                                     1                  0.001480   \n",
       "                                                     2                  0.001465   \n",
       "                                                     3                  0.001619   \n",
       "                                                     4                  0.001453   \n",
       "standard                      False                  0                  0.003269   \n",
       "                                                     1                  0.003245   \n",
       "                                                     2                  0.002738   \n",
       "                                                     3                  0.002844   \n",
       "                                                     4                  0.002904   \n",
       "\n",
       "                                                                              \n",
       "                                                                       count  \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx        \n",
       "akt_monotonic                 False                  0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  \n",
       "alibi_monotonic               False                  0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  \n",
       "alibi_monotonic_q_k           False                  0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  \n",
       "learnable_alibi_monotonic     False                  0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  \n",
       "learnable_alibi_monotonic_q_k False                  0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  \n",
       "                              True                   0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  \n",
       "standard                      False                  0                   100  \n",
       "                                                     1                   100  \n",
       "                                                     2                   100  \n",
       "                                                     3                   100  \n",
       "                                                     4                   100  "
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_sweep_groupby = df_sweep.groupby([\"model.attn_variant\", \"model.use_decoder_only\", \"data.val_fold_idx\"])[[\"val_auc\", \"val_accuracy\"]].agg([\"max\", \"mean\", \"std\", \"count\"])\n",
    "df_sweep_groupby"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/akt/0/85,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/akt/1/74,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/akt/2/18,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/akt/3/57,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/akt/4/91,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi/0/78,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi/1/28,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi/2/82,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi/3/21,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi/4/65,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi_q_k/0/75,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi_q_k/1/93,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi_q_k/2/81,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi_q_k/3/84,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/alibi_q_k/4/86,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic/0/98,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic/1/3,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic/2/82,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic/3/94,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic/4/65,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k/0/33,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k/1/96,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k/2/74,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k/3/95,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k/4/26,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k_dec_only/0/65,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k_dec_only/1/96,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k_dec_only/2/54,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k_dec_only/3/89,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/learnable_alibi_monotonic_q_k_dec_only/4/44,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/standard_pe/0/63,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/standard_pe/1/80,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/standard_pe/2/63,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/standard_pe/3/73,/home/knowledge-tracing/ktst/sweeps/ablation_assist2009/standard_pe/4/82\n"
     ]
    }
   ],
   "source": [
    "max_idx = df_sweep.groupby([\"model.attn_variant\", \"model.use_decoder_only\", \"data.val_fold_idx\"])[\"val_auc\"].idxmax()\n",
    "best_runs = df_sweep.iloc[max_idx]\n",
    "print(\",\".join(best_runs[\"run_dir\"].values))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "# reproduce train on same gpu\n",
    "df_train = summarize_outputs_in_df(outputs_dir=train_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr:last-of-type th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">val_auc</th>\n",
       "      <th colspan=\"4\" halign=\"left\">val_accuracy</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>max</th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "      <th>max</th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>model.attn_variant</th>\n",
       "      <th>model.use_decoder_only</th>\n",
       "      <th>data.val_fold_idx</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">akt_monotonic</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.791687</td>\n",
       "      <td>0.791687</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.752263</td>\n",
       "      <td>0.752263</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.782070</td>\n",
       "      <td>0.782070</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.748402</td>\n",
       "      <td>0.748402</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.790056</td>\n",
       "      <td>0.790056</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.755062</td>\n",
       "      <td>0.755062</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.784018</td>\n",
       "      <td>0.784018</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.749684</td>\n",
       "      <td>0.749684</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.790017</td>\n",
       "      <td>0.790017</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.744718</td>\n",
       "      <td>0.744718</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">alibi_monotonic</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.790275</td>\n",
       "      <td>0.790275</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.750457</td>\n",
       "      <td>0.750457</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.780984</td>\n",
       "      <td>0.780984</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.746536</td>\n",
       "      <td>0.746536</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.790900</td>\n",
       "      <td>0.790900</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.754447</td>\n",
       "      <td>0.754447</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.781265</td>\n",
       "      <td>0.781265</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.744369</td>\n",
       "      <td>0.744369</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.788992</td>\n",
       "      <td>0.788992</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.743961</td>\n",
       "      <td>0.743961</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">alibi_monotonic_q_k</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.793804</td>\n",
       "      <td>0.793804</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.752657</td>\n",
       "      <td>0.752657</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.783544</td>\n",
       "      <td>0.783544</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.747082</td>\n",
       "      <td>0.747082</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.793501</td>\n",
       "      <td>0.793501</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.758160</td>\n",
       "      <td>0.758160</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.785331</td>\n",
       "      <td>0.785331</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.749082</td>\n",
       "      <td>0.749082</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.791253</td>\n",
       "      <td>0.791253</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.746945</td>\n",
       "      <td>0.746945</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">learnable_alibi_monotonic</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.793063</td>\n",
       "      <td>0.793063</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.751453</td>\n",
       "      <td>0.751453</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.781806</td>\n",
       "      <td>0.781806</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.745535</td>\n",
       "      <td>0.745535</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.791413</td>\n",
       "      <td>0.791413</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.757727</td>\n",
       "      <td>0.757727</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.783798</td>\n",
       "      <td>0.783798</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.748882</td>\n",
       "      <td>0.748882</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.789391</td>\n",
       "      <td>0.789391</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.744162</td>\n",
       "      <td>0.744162</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"10\" valign=\"top\">learnable_alibi_monotonic_q_k</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.794848</td>\n",
       "      <td>0.794848</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.753375</td>\n",
       "      <td>0.753375</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.784065</td>\n",
       "      <td>0.784065</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.747492</td>\n",
       "      <td>0.747492</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.793454</td>\n",
       "      <td>0.793454</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.758456</td>\n",
       "      <td>0.758456</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.785915</td>\n",
       "      <td>0.785915</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.749062</td>\n",
       "      <td>0.749062</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.791582</td>\n",
       "      <td>0.791582</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.747813</td>\n",
       "      <td>0.747813</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">True</th>\n",
       "      <th>0</th>\n",
       "      <td>0.793369</td>\n",
       "      <td>0.793369</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.751870</td>\n",
       "      <td>0.751870</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.783265</td>\n",
       "      <td>0.783265</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.746331</td>\n",
       "      <td>0.746331</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.792105</td>\n",
       "      <td>0.792105</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.756360</td>\n",
       "      <td>0.756360</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.784848</td>\n",
       "      <td>0.784848</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.748782</td>\n",
       "      <td>0.748782</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.790955</td>\n",
       "      <td>0.790955</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.744874</td>\n",
       "      <td>0.744874</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">standard</th>\n",
       "      <th rowspan=\"5\" valign=\"top\">False</th>\n",
       "      <th>0</th>\n",
       "      <td>0.770023</td>\n",
       "      <td>0.770023</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.735153</td>\n",
       "      <td>0.735153</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0.761767</td>\n",
       "      <td>0.761767</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.732727</td>\n",
       "      <td>0.732727</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.773836</td>\n",
       "      <td>0.773836</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.742535</td>\n",
       "      <td>0.742535</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.765727</td>\n",
       "      <td>0.765727</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.737851</td>\n",
       "      <td>0.737851</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.766297</td>\n",
       "      <td>0.766297</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>0.727576</td>\n",
       "      <td>0.727576</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                                         val_auc  \\\n",
       "                                                                             max   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.791687   \n",
       "                                                     1                  0.782070   \n",
       "                                                     2                  0.790056   \n",
       "                                                     3                  0.784018   \n",
       "                                                     4                  0.790017   \n",
       "alibi_monotonic               False                  0                  0.790275   \n",
       "                                                     1                  0.780984   \n",
       "                                                     2                  0.790900   \n",
       "                                                     3                  0.781265   \n",
       "                                                     4                  0.788992   \n",
       "alibi_monotonic_q_k           False                  0                  0.793804   \n",
       "                                                     1                  0.783544   \n",
       "                                                     2                  0.793501   \n",
       "                                                     3                  0.785331   \n",
       "                                                     4                  0.791253   \n",
       "learnable_alibi_monotonic     False                  0                  0.793063   \n",
       "                                                     1                  0.781806   \n",
       "                                                     2                  0.791413   \n",
       "                                                     3                  0.783798   \n",
       "                                                     4                  0.789391   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.794848   \n",
       "                                                     1                  0.784065   \n",
       "                                                     2                  0.793454   \n",
       "                                                     3                  0.785915   \n",
       "                                                     4                  0.791582   \n",
       "                              True                   0                  0.793369   \n",
       "                                                     1                  0.783265   \n",
       "                                                     2                  0.792105   \n",
       "                                                     3                  0.784848   \n",
       "                                                     4                  0.790955   \n",
       "standard                      False                  0                  0.770023   \n",
       "                                                     1                  0.761767   \n",
       "                                                     2                  0.773836   \n",
       "                                                     3                  0.765727   \n",
       "                                                     4                  0.766297   \n",
       "\n",
       "                                                                                  \\\n",
       "                                                                            mean   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.791687   \n",
       "                                                     1                  0.782070   \n",
       "                                                     2                  0.790056   \n",
       "                                                     3                  0.784018   \n",
       "                                                     4                  0.790017   \n",
       "alibi_monotonic               False                  0                  0.790275   \n",
       "                                                     1                  0.780984   \n",
       "                                                     2                  0.790900   \n",
       "                                                     3                  0.781265   \n",
       "                                                     4                  0.788992   \n",
       "alibi_monotonic_q_k           False                  0                  0.793804   \n",
       "                                                     1                  0.783544   \n",
       "                                                     2                  0.793501   \n",
       "                                                     3                  0.785331   \n",
       "                                                     4                  0.791253   \n",
       "learnable_alibi_monotonic     False                  0                  0.793063   \n",
       "                                                     1                  0.781806   \n",
       "                                                     2                  0.791413   \n",
       "                                                     3                  0.783798   \n",
       "                                                     4                  0.789391   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.794848   \n",
       "                                                     1                  0.784065   \n",
       "                                                     2                  0.793454   \n",
       "                                                     3                  0.785915   \n",
       "                                                     4                  0.791582   \n",
       "                              True                   0                  0.793369   \n",
       "                                                     1                  0.783265   \n",
       "                                                     2                  0.792105   \n",
       "                                                     3                  0.784848   \n",
       "                                                     4                  0.790955   \n",
       "standard                      False                  0                  0.770023   \n",
       "                                                     1                  0.761767   \n",
       "                                                     2                  0.773836   \n",
       "                                                     3                  0.765727   \n",
       "                                                     4                  0.766297   \n",
       "\n",
       "                                                                            \\\n",
       "                                                                       std   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx       \n",
       "akt_monotonic                 False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "alibi_monotonic               False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "alibi_monotonic_q_k           False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "learnable_alibi_monotonic     False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "learnable_alibi_monotonic_q_k False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "                              True                   0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "standard                      False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "\n",
       "                                                                              \\\n",
       "                                                                       count   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx         \n",
       "akt_monotonic                 False                  0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "alibi_monotonic               False                  0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "alibi_monotonic_q_k           False                  0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "learnable_alibi_monotonic     False                  0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "learnable_alibi_monotonic_q_k False                  0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "                              True                   0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "standard                      False                  0                     1   \n",
       "                                                     1                     1   \n",
       "                                                     2                     1   \n",
       "                                                     3                     1   \n",
       "                                                     4                     1   \n",
       "\n",
       "                                                                       val_accuracy  \\\n",
       "                                                                                max   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx                \n",
       "akt_monotonic                 False                  0                     0.752263   \n",
       "                                                     1                     0.748402   \n",
       "                                                     2                     0.755062   \n",
       "                                                     3                     0.749684   \n",
       "                                                     4                     0.744718   \n",
       "alibi_monotonic               False                  0                     0.750457   \n",
       "                                                     1                     0.746536   \n",
       "                                                     2                     0.754447   \n",
       "                                                     3                     0.744369   \n",
       "                                                     4                     0.743961   \n",
       "alibi_monotonic_q_k           False                  0                     0.752657   \n",
       "                                                     1                     0.747082   \n",
       "                                                     2                     0.758160   \n",
       "                                                     3                     0.749082   \n",
       "                                                     4                     0.746945   \n",
       "learnable_alibi_monotonic     False                  0                     0.751453   \n",
       "                                                     1                     0.745535   \n",
       "                                                     2                     0.757727   \n",
       "                                                     3                     0.748882   \n",
       "                                                     4                     0.744162   \n",
       "learnable_alibi_monotonic_q_k False                  0                     0.753375   \n",
       "                                                     1                     0.747492   \n",
       "                                                     2                     0.758456   \n",
       "                                                     3                     0.749062   \n",
       "                                                     4                     0.747813   \n",
       "                              True                   0                     0.751870   \n",
       "                                                     1                     0.746331   \n",
       "                                                     2                     0.756360   \n",
       "                                                     3                     0.748782   \n",
       "                                                     4                     0.744874   \n",
       "standard                      False                  0                     0.735153   \n",
       "                                                     1                     0.732727   \n",
       "                                                     2                     0.742535   \n",
       "                                                     3                     0.737851   \n",
       "                                                     4                     0.727576   \n",
       "\n",
       "                                                                                  \\\n",
       "                                                                            mean   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx             \n",
       "akt_monotonic                 False                  0                  0.752263   \n",
       "                                                     1                  0.748402   \n",
       "                                                     2                  0.755062   \n",
       "                                                     3                  0.749684   \n",
       "                                                     4                  0.744718   \n",
       "alibi_monotonic               False                  0                  0.750457   \n",
       "                                                     1                  0.746536   \n",
       "                                                     2                  0.754447   \n",
       "                                                     3                  0.744369   \n",
       "                                                     4                  0.743961   \n",
       "alibi_monotonic_q_k           False                  0                  0.752657   \n",
       "                                                     1                  0.747082   \n",
       "                                                     2                  0.758160   \n",
       "                                                     3                  0.749082   \n",
       "                                                     4                  0.746945   \n",
       "learnable_alibi_monotonic     False                  0                  0.751453   \n",
       "                                                     1                  0.745535   \n",
       "                                                     2                  0.757727   \n",
       "                                                     3                  0.748882   \n",
       "                                                     4                  0.744162   \n",
       "learnable_alibi_monotonic_q_k False                  0                  0.753375   \n",
       "                                                     1                  0.747492   \n",
       "                                                     2                  0.758456   \n",
       "                                                     3                  0.749062   \n",
       "                                                     4                  0.747813   \n",
       "                              True                   0                  0.751870   \n",
       "                                                     1                  0.746331   \n",
       "                                                     2                  0.756360   \n",
       "                                                     3                  0.748782   \n",
       "                                                     4                  0.744874   \n",
       "standard                      False                  0                  0.735153   \n",
       "                                                     1                  0.732727   \n",
       "                                                     2                  0.742535   \n",
       "                                                     3                  0.737851   \n",
       "                                                     4                  0.727576   \n",
       "\n",
       "                                                                            \\\n",
       "                                                                       std   \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx       \n",
       "akt_monotonic                 False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "alibi_monotonic               False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "alibi_monotonic_q_k           False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "learnable_alibi_monotonic     False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "learnable_alibi_monotonic_q_k False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "                              True                   0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "standard                      False                  0                 NaN   \n",
       "                                                     1                 NaN   \n",
       "                                                     2                 NaN   \n",
       "                                                     3                 NaN   \n",
       "                                                     4                 NaN   \n",
       "\n",
       "                                                                              \n",
       "                                                                       count  \n",
       "model.attn_variant            model.use_decoder_only data.val_fold_idx        \n",
       "akt_monotonic                 False                  0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  \n",
       "alibi_monotonic               False                  0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  \n",
       "alibi_monotonic_q_k           False                  0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  \n",
       "learnable_alibi_monotonic     False                  0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  \n",
       "learnable_alibi_monotonic_q_k False                  0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  \n",
       "                              True                   0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  \n",
       "standard                      False                  0                     1  \n",
       "                                                     1                     1  \n",
       "                                                     2                     1  \n",
       "                                                     3                     1  \n",
       "                                                     4                     1  "
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_train_groupby = df_train.groupby([\"model.attn_variant\", \"model.use_decoder_only\", \"data.val_fold_idx\"])[[\"val_auc\", \"val_accuracy\"]].agg([\"max\", \"mean\", \"std\", \"count\"])\n",
    "df_train_groupby"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "# test\n",
    "df_test = summarize_outputs_in_df(outputs_dir=test_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr:last-of-type th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"3\" halign=\"left\">best_val_metric</th>\n",
       "      <th colspan=\"3\" halign=\"left\">test_auc</th>\n",
       "      <th colspan=\"3\" halign=\"left\">test_accuracy</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>count</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>model.attn_variant</th>\n",
       "      <th>model.use_decoder_only</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>akt_monotonic</th>\n",
       "      <th>False</th>\n",
       "      <td>0.787569</td>\n",
       "      <td>0.004242</td>\n",
       "      <td>5</td>\n",
       "      <td>0.795767</td>\n",
       "      <td>0.001217</td>\n",
       "      <td>5</td>\n",
       "      <td>0.746405</td>\n",
       "      <td>0.000997</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>alibi_monotonic</th>\n",
       "      <th>False</th>\n",
       "      <td>0.786483</td>\n",
       "      <td>0.004941</td>\n",
       "      <td>5</td>\n",
       "      <td>0.795310</td>\n",
       "      <td>0.002061</td>\n",
       "      <td>5</td>\n",
       "      <td>0.745603</td>\n",
       "      <td>0.002339</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>alibi_monotonic_q_k</th>\n",
       "      <th>False</th>\n",
       "      <td>0.789487</td>\n",
       "      <td>0.004756</td>\n",
       "      <td>5</td>\n",
       "      <td>0.797801</td>\n",
       "      <td>0.001120</td>\n",
       "      <td>5</td>\n",
       "      <td>0.747948</td>\n",
       "      <td>0.000814</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>learnable_alibi_monotonic</th>\n",
       "      <th>False</th>\n",
       "      <td>0.787894</td>\n",
       "      <td>0.004878</td>\n",
       "      <td>5</td>\n",
       "      <td>0.797590</td>\n",
       "      <td>0.001439</td>\n",
       "      <td>5</td>\n",
       "      <td>0.747623</td>\n",
       "      <td>0.001300</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">learnable_alibi_monotonic_q_k</th>\n",
       "      <th>False</th>\n",
       "      <td>0.789973</td>\n",
       "      <td>0.004739</td>\n",
       "      <td>5</td>\n",
       "      <td>0.799346</td>\n",
       "      <td>0.001368</td>\n",
       "      <td>5</td>\n",
       "      <td>0.749032</td>\n",
       "      <td>0.001444</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>True</th>\n",
       "      <td>0.788908</td>\n",
       "      <td>0.004545</td>\n",
       "      <td>5</td>\n",
       "      <td>0.797704</td>\n",
       "      <td>0.001215</td>\n",
       "      <td>5</td>\n",
       "      <td>0.747298</td>\n",
       "      <td>0.000784</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>standard</th>\n",
       "      <th>False</th>\n",
       "      <td>0.767530</td>\n",
       "      <td>0.004582</td>\n",
       "      <td>5</td>\n",
       "      <td>0.774404</td>\n",
       "      <td>0.001577</td>\n",
       "      <td>5</td>\n",
       "      <td>0.730734</td>\n",
       "      <td>0.001683</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                     best_val_metric  \\\n",
       "                                                                mean   \n",
       "model.attn_variant            model.use_decoder_only                   \n",
       "akt_monotonic                 False                         0.787569   \n",
       "alibi_monotonic               False                         0.786483   \n",
       "alibi_monotonic_q_k           False                         0.789487   \n",
       "learnable_alibi_monotonic     False                         0.787894   \n",
       "learnable_alibi_monotonic_q_k False                         0.789973   \n",
       "                              True                          0.788908   \n",
       "standard                      False                         0.767530   \n",
       "\n",
       "                                                                      \\\n",
       "                                                           std count   \n",
       "model.attn_variant            model.use_decoder_only                   \n",
       "akt_monotonic                 False                   0.004242     5   \n",
       "alibi_monotonic               False                   0.004941     5   \n",
       "alibi_monotonic_q_k           False                   0.004756     5   \n",
       "learnable_alibi_monotonic     False                   0.004878     5   \n",
       "learnable_alibi_monotonic_q_k False                   0.004739     5   \n",
       "                              True                    0.004545     5   \n",
       "standard                      False                   0.004582     5   \n",
       "\n",
       "                                                      test_auc            \\\n",
       "                                                          mean       std   \n",
       "model.attn_variant            model.use_decoder_only                       \n",
       "akt_monotonic                 False                   0.795767  0.001217   \n",
       "alibi_monotonic               False                   0.795310  0.002061   \n",
       "alibi_monotonic_q_k           False                   0.797801  0.001120   \n",
       "learnable_alibi_monotonic     False                   0.797590  0.001439   \n",
       "learnable_alibi_monotonic_q_k False                   0.799346  0.001368   \n",
       "                              True                    0.797704  0.001215   \n",
       "standard                      False                   0.774404  0.001577   \n",
       "\n",
       "                                                           test_accuracy  \\\n",
       "                                                     count          mean   \n",
       "model.attn_variant            model.use_decoder_only                       \n",
       "akt_monotonic                 False                      5      0.746405   \n",
       "alibi_monotonic               False                      5      0.745603   \n",
       "alibi_monotonic_q_k           False                      5      0.747948   \n",
       "learnable_alibi_monotonic     False                      5      0.747623   \n",
       "learnable_alibi_monotonic_q_k False                      5      0.749032   \n",
       "                              True                       5      0.747298   \n",
       "standard                      False                      5      0.730734   \n",
       "\n",
       "                                                                      \n",
       "                                                           std count  \n",
       "model.attn_variant            model.use_decoder_only                  \n",
       "akt_monotonic                 False                   0.000997     5  \n",
       "alibi_monotonic               False                   0.002339     5  \n",
       "alibi_monotonic_q_k           False                   0.000814     5  \n",
       "learnable_alibi_monotonic     False                   0.001300     5  \n",
       "learnable_alibi_monotonic_q_k False                   0.001444     5  \n",
       "                              True                    0.000784     5  \n",
       "standard                      False                   0.001683     5  "
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_test_results = df_test.groupby([\"model.attn_variant\", \"model.use_decoder_only\"])[[\"best_val_metric\", \"test_auc\", \"test_accuracy\"]].agg([\"mean\", \"std\", \"count\"])\n",
    "df_test_results"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "dev",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
