{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import os\n",
    "import json\n",
    "from convlab.base_models.t5.mdst.evaluate_qa import eval_slot_pairs_prediction"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Main Exp Table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "aug_types = [(0, 0.0), (2, 2.0), (5, 2.0)]#, (1, 0.1)]\n",
    "index_names = ['Single', 'Single+Concat', 'Single+ConcatRel']#, '90%Single+10%Multi']\n",
    "column_names = ['RSA', 'CDTA']\n",
    "datasets = ['sgd/group0', 'multiwoz21']\n",
    "models = ['T5DST', 'MinTL', 'SDPDST']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"8\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"8\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">T5DST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">MinTL</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">SDPDST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                          sgd/group0                                      \\\n",
       "                                 RSA                                CDTA   \n",
       "                            domain_1 domain_2 domain_3 domain_4 domain_1   \n",
       "T5DST  Single           0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+Concat    0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+ConcatRel 0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "MinTL  Single           0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+Concat    0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+ConcatRel 0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "SDPDST Single           0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+Concat    0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+ConcatRel 0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4        NaN      NaN      NaN      NaN      NaN   \n",
       "\n",
       "                                                     multiwoz21           \\\n",
       "                                                            RSA            \n",
       "                          domain_2 domain_3 domain_4   domain_1 domain_2   \n",
       "T5DST  Single           0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "       Single+Concat    0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "       Single+ConcatRel 0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "MinTL  Single           0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "       Single+Concat    0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "       Single+ConcatRel 0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "SDPDST Single           0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "       Single+Concat    0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "       Single+ConcatRel 0      NaN      NaN      NaN        NaN      NaN   \n",
       "                        4      NaN      NaN      NaN        NaN      NaN   \n",
       "\n",
       "                                                                        \\\n",
       "                                                CDTA                     \n",
       "                          domain_3 domain_4 domain_1 domain_2 domain_3   \n",
       "T5DST  Single           0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+Concat    0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+ConcatRel 0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "MinTL  Single           0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+Concat    0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+ConcatRel 0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "SDPDST Single           0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+Concat    0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "       Single+ConcatRel 0      NaN      NaN      NaN      NaN      NaN   \n",
       "                        4      NaN      NaN      NaN      NaN      NaN   \n",
       "\n",
       "                                    \n",
       "                                    \n",
       "                          domain_4  \n",
       "T5DST  Single           0      NaN  \n",
       "                        4      NaN  \n",
       "       Single+Concat    0      NaN  \n",
       "                        4      NaN  \n",
       "       Single+ConcatRel 0      NaN  \n",
       "                        4      NaN  \n",
       "MinTL  Single           0      NaN  \n",
       "                        4      NaN  \n",
       "       Single+Concat    0      NaN  \n",
       "                        4      NaN  \n",
       "       Single+ConcatRel 0      NaN  \n",
       "                        4      NaN  \n",
       "SDPDST Single           0      NaN  \n",
       "                        4      NaN  \n",
       "       Single+Concat    0      NaN  \n",
       "                        4      NaN  \n",
       "       Single+ConcatRel 0      NaN  \n",
       "                        4      NaN  "
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "main_exp_table = pd.DataFrame(index=pd.MultiIndex.from_product([models, index_names, [0, 4]]), \n",
    "                              columns=pd.MultiIndex.from_product([datasets, column_names, [f'domain_{i}' for i in range(1,5)]]))\n",
    "main_exp_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:18: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'RSA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'RSA']\n",
      "/tmp/ipykernel_33250/1508128031.py:19: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', 'CDTA']\n",
      "/tmp/ipykernel_33250/1508128031.py:21: PerformanceWarning: indexing past lexsort depth may impact performance.\n",
      "  table.loc[(model_name, index_name, k-j), (dataset, 'CDTA', f'domain_{1}')] = df.loc['all', 'CDTA']\n"
     ]
    }
   ],
   "source": [
    "import warnings\n",
    "\n",
    "# Fill main_exp_table from the per-run markdown result files, then convert every\n",
    "# cell to a percentage rounded to one decimal.\n",
    "# NOTE: the table is mutated in place and then rescaled by 100 as a whole, so\n",
    "# re-running this cell without rebuilding main_exp_table rescales any cell whose\n",
    "# result file is missing (those cells are not refreshed by the loop).\n",
    "table = main_exp_table\n",
    "with warnings.catch_warnings():\n",
    "    # Each .loc write below triggers 'indexing past lexsort depth' on this table;\n",
    "    # silence that category here only so the cell output is not flooded.\n",
    "    warnings.simplefilter('ignore', category=pd.errors.PerformanceWarning)\n",
    "    for i, (aug_type, aug_times) in enumerate(aug_types):\n",
    "        index_name = index_names[i]\n",
    "        # Each base model id j is paired with id j+4; the row label k-j is 0 or 4.\n",
    "        for j, model_name in zip([0,1,3], models):\n",
    "            for k in [j, j+4]:\n",
    "                c = 4 if k == 1 else 100\n",
    "                row = (model_name, index_name, k-j)\n",
    "                for dataset in datasets:\n",
    "                    res_dir = f'output0615/{dataset}/qadst_f1_th>0.1/t5-large_aug{aug_type}_x{aug_times}_model{k}_context{c}'\n",
    "                    res_file = f'{res_dir}/test_multi_domain_result_ori_cdta.md'\n",
    "                    if not os.path.exists(res_file):\n",
    "                        # No result for this configuration: leave the cells untouched.\n",
    "                        continue\n",
    "                    # Parse the '|'-separated markdown table: drop the all-empty columns,\n",
    "                    # skip the first row (presumably the '---' separator -- TODO confirm),\n",
    "                    # then strip whitespace from cells, column names and row labels.\n",
    "                    df = pd.read_table(res_file, sep='|', index_col=1).dropna(axis=1, how='all').iloc[1:]\n",
    "                    df = df.apply(lambda x: x.str.strip())\n",
    "                    df = df.rename(columns=str.strip).rename(index=str.strip)\n",
    "\n",
    "                    for dom_cnt in range(1, 5):\n",
    "                        for metric in ('RSA', 'CDTA'):\n",
    "                            table.loc[row, (dataset, metric, f'domain_{dom_cnt}')] = df.loc[f'domain_{dom_cnt}', metric]\n",
    "                    # The CDTA/domain_1 slot is overwritten with the overall ('all') CDTA.\n",
    "                    table.loc[row, (dataset, 'CDTA', 'domain_1')] = df.loc['all', 'CDTA']\n",
    "\n",
    "# Column-wise conversion (unparseable cells become NaN), scaled to percent.\n",
    "main_exp_table = main_exp_table.apply(pd.to_numeric, errors='coerce').mul(100).round(1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Drop multiwoz21 RSA/domain_4 and, for both datasets, the CDTA columns for\n",
    "# domain_2..domain_4 (only CDTA/domain_1 is kept).\n",
    "# errors='ignore' keeps the cell re-runnable once the columns are already gone;\n",
    "# without it a second run raises KeyError.\n",
    "main_exp_table = main_exp_table.drop(\n",
    "    columns=[\n",
    "        ('multiwoz21', 'RSA', 'domain_4'),\n",
    "        ('multiwoz21', 'CDTA', 'domain_2'),\n",
    "        ('multiwoz21', 'CDTA', 'domain_3'),\n",
    "        ('multiwoz21', 'CDTA', 'domain_4'),\n",
    "        ('sgd/group0', 'CDTA', 'domain_2'),\n",
    "        ('sgd/group0', 'CDTA', 'domain_3'),\n",
    "        ('sgd/group0', 'CDTA', 'domain_4'),\n",
    "    ],\n",
    "    errors='ignore',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"4\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th colspan=\"3\" halign=\"left\">RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_1</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">T5DST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>94.1</td>\n",
       "      <td>44.9</td>\n",
       "      <td>23.5</td>\n",
       "      <td>13.2</td>\n",
       "      <td>2.7</td>\n",
       "      <td>85.9</td>\n",
       "      <td>44.4</td>\n",
       "      <td>22.1</td>\n",
       "      <td>1.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.8</td>\n",
       "      <td>71.8</td>\n",
       "      <td>59.5</td>\n",
       "      <td>48.4</td>\n",
       "      <td>11.8</td>\n",
       "      <td>85.1</td>\n",
       "      <td>65.2</td>\n",
       "      <td>54.1</td>\n",
       "      <td>6.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>94.0</td>\n",
       "      <td>78.1</td>\n",
       "      <td>53.5</td>\n",
       "      <td>32.9</td>\n",
       "      <td>1.6</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.9</td>\n",
       "      <td>44.9</td>\n",
       "      <td>11.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.9</td>\n",
       "      <td>76.9</td>\n",
       "      <td>74.7</td>\n",
       "      <td>50.9</td>\n",
       "      <td>1.8</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.6</td>\n",
       "      <td>68.4</td>\n",
       "      <td>11.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>94.0</td>\n",
       "      <td>81.8</td>\n",
       "      <td>54.3</td>\n",
       "      <td>33.1</td>\n",
       "      <td>25.8</td>\n",
       "      <td>85.1</td>\n",
       "      <td>82.4</td>\n",
       "      <td>50.7</td>\n",
       "      <td>20.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.1</td>\n",
       "      <td>80.2</td>\n",
       "      <td>77.3</td>\n",
       "      <td>65.5</td>\n",
       "      <td>21.1</td>\n",
       "      <td>84.7</td>\n",
       "      <td>80.5</td>\n",
       "      <td>70.0</td>\n",
       "      <td>27.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">MinTL</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>92.3</td>\n",
       "      <td>47.4</td>\n",
       "      <td>29.8</td>\n",
       "      <td>12.9</td>\n",
       "      <td>2.1</td>\n",
       "      <td>83.0</td>\n",
       "      <td>52.7</td>\n",
       "      <td>37.2</td>\n",
       "      <td>1.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.5</td>\n",
       "      <td>64.3</td>\n",
       "      <td>56.2</td>\n",
       "      <td>37.0</td>\n",
       "      <td>0.8</td>\n",
       "      <td>83.9</td>\n",
       "      <td>59.3</td>\n",
       "      <td>44.4</td>\n",
       "      <td>1.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>92.8</td>\n",
       "      <td>70.0</td>\n",
       "      <td>67.8</td>\n",
       "      <td>54.3</td>\n",
       "      <td>1.1</td>\n",
       "      <td>84.2</td>\n",
       "      <td>81.5</td>\n",
       "      <td>64.0</td>\n",
       "      <td>5.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.4</td>\n",
       "      <td>74.4</td>\n",
       "      <td>72.2</td>\n",
       "      <td>58.3</td>\n",
       "      <td>0.5</td>\n",
       "      <td>84.4</td>\n",
       "      <td>82.0</td>\n",
       "      <td>65.1</td>\n",
       "      <td>7.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>91.7</td>\n",
       "      <td>70.2</td>\n",
       "      <td>64.0</td>\n",
       "      <td>54.5</td>\n",
       "      <td>18.2</td>\n",
       "      <td>83.5</td>\n",
       "      <td>80.0</td>\n",
       "      <td>66.3</td>\n",
       "      <td>27.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>92.9</td>\n",
       "      <td>78.0</td>\n",
       "      <td>73.4</td>\n",
       "      <td>62.9</td>\n",
       "      <td>21.8</td>\n",
       "      <td>83.6</td>\n",
       "      <td>80.4</td>\n",
       "      <td>66.3</td>\n",
       "      <td>29.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">SDPDST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>93.6</td>\n",
       "      <td>59.0</td>\n",
       "      <td>44.7</td>\n",
       "      <td>47.7</td>\n",
       "      <td>3.8</td>\n",
       "      <td>86.2</td>\n",
       "      <td>58.0</td>\n",
       "      <td>39.8</td>\n",
       "      <td>1.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>94.7</td>\n",
       "      <td>74.7</td>\n",
       "      <td>66.2</td>\n",
       "      <td>54.6</td>\n",
       "      <td>13.2</td>\n",
       "      <td>86.2</td>\n",
       "      <td>66.9</td>\n",
       "      <td>54.0</td>\n",
       "      <td>8.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>93.3</td>\n",
       "      <td>81.9</td>\n",
       "      <td>79.5</td>\n",
       "      <td>66.6</td>\n",
       "      <td>0.8</td>\n",
       "      <td>87.2</td>\n",
       "      <td>84.9</td>\n",
       "      <td>68.5</td>\n",
       "      <td>9.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>95.0</td>\n",
       "      <td>78.3</td>\n",
       "      <td>77.5</td>\n",
       "      <td>58.7</td>\n",
       "      <td>1.7</td>\n",
       "      <td>86.6</td>\n",
       "      <td>84.3</td>\n",
       "      <td>68.1</td>\n",
       "      <td>8.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>92.6</td>\n",
       "      <td>83.4</td>\n",
       "      <td>80.1</td>\n",
       "      <td>74.6</td>\n",
       "      <td>18.1</td>\n",
       "      <td>86.9</td>\n",
       "      <td>83.8</td>\n",
       "      <td>72.4</td>\n",
       "      <td>26.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>94.8</td>\n",
       "      <td>81.9</td>\n",
       "      <td>78.4</td>\n",
       "      <td>66.4</td>\n",
       "      <td>19.7</td>\n",
       "      <td>86.2</td>\n",
       "      <td>82.6</td>\n",
       "      <td>70.6</td>\n",
       "      <td>27.7</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                          sgd/group0                                      \\\n",
       "                                 RSA                                CDTA   \n",
       "                            domain_1 domain_2 domain_3 domain_4 domain_1   \n",
       "T5DST  Single           0       94.1     44.9     23.5     13.2      2.7   \n",
       "                        4       93.8     71.8     59.5     48.4     11.8   \n",
       "       Single+Concat    0       94.0     78.1     53.5     32.9      1.6   \n",
       "                        4       93.9     76.9     74.7     50.9      1.8   \n",
       "       Single+ConcatRel 0       94.0     81.8     54.3     33.1     25.8   \n",
       "                        4       93.1     80.2     77.3     65.5     21.1   \n",
       "MinTL  Single           0       92.3     47.4     29.8     12.9      2.1   \n",
       "                        4       93.5     64.3     56.2     37.0      0.8   \n",
       "       Single+Concat    0       92.8     70.0     67.8     54.3      1.1   \n",
       "                        4       93.4     74.4     72.2     58.3      0.5   \n",
       "       Single+ConcatRel 0       91.7     70.2     64.0     54.5     18.2   \n",
       "                        4       92.9     78.0     73.4     62.9     21.8   \n",
       "SDPDST Single           0       93.6     59.0     44.7     47.7      3.8   \n",
       "                        4       94.7     74.7     66.2     54.6     13.2   \n",
       "       Single+Concat    0       93.3     81.9     79.5     66.6      0.8   \n",
       "                        4       95.0     78.3     77.5     58.7      1.7   \n",
       "       Single+ConcatRel 0       92.6     83.4     80.1     74.6     18.1   \n",
       "                        4       94.8     81.9     78.4     66.4     19.7   \n",
       "\n",
       "                          multiwoz21                             \n",
       "                                 RSA                       CDTA  \n",
       "                            domain_1 domain_2 domain_3 domain_1  \n",
       "T5DST  Single           0       85.9     44.4     22.1      1.6  \n",
       "                        4       85.1     65.2     54.1      6.6  \n",
       "       Single+Concat    0       85.3     83.9     44.9     11.2  \n",
       "                        4       85.3     83.6     68.4     11.1  \n",
       "       Single+ConcatRel 0       85.1     82.4     50.7     20.9  \n",
       "                        4       84.7     80.5     70.0     27.6  \n",
       "MinTL  Single           0       83.0     52.7     37.2      1.8  \n",
       "                        4       83.9     59.3     44.4      1.9  \n",
       "       Single+Concat    0       84.2     81.5     64.0      5.8  \n",
       "                        4       84.4     82.0     65.1      7.3  \n",
       "       Single+ConcatRel 0       83.5     80.0     66.3     27.5  \n",
       "                        4       83.6     80.4     66.3     29.1  \n",
       "SDPDST Single           0       86.2     58.0     39.8      1.4  \n",
       "                        4       86.2     66.9     54.0      8.5  \n",
       "       Single+Concat    0       87.2     84.9     68.5      9.1  \n",
       "                        4       86.6     84.3     68.1      8.3  \n",
       "       Single+ConcatRel 0       86.9     83.8     72.4     26.8  \n",
       "                        4       86.2     82.6     70.6     27.7  "
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "main_exp_table  # tag 0620, 'ori cdta': values loaded from test_multi_domain_result_ori_cdta.md (0620 is presumably a date -- TODO confirm)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"4\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th colspan=\"3\" halign=\"left\">RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_1</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">T5DST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>94.1</td>\n",
       "      <td>44.9</td>\n",
       "      <td>23.5</td>\n",
       "      <td>13.2</td>\n",
       "      <td>4.9</td>\n",
       "      <td>85.9</td>\n",
       "      <td>44.4</td>\n",
       "      <td>22.1</td>\n",
       "      <td>4.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.8</td>\n",
       "      <td>71.8</td>\n",
       "      <td>59.5</td>\n",
       "      <td>48.4</td>\n",
       "      <td>15.8</td>\n",
       "      <td>85.1</td>\n",
       "      <td>65.2</td>\n",
       "      <td>54.1</td>\n",
       "      <td>18.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>94.0</td>\n",
       "      <td>78.1</td>\n",
       "      <td>53.5</td>\n",
       "      <td>32.9</td>\n",
       "      <td>5.5</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.9</td>\n",
       "      <td>44.9</td>\n",
       "      <td>32.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.9</td>\n",
       "      <td>76.9</td>\n",
       "      <td>74.7</td>\n",
       "      <td>50.9</td>\n",
       "      <td>8.8</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.6</td>\n",
       "      <td>68.4</td>\n",
       "      <td>37.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>94.0</td>\n",
       "      <td>81.8</td>\n",
       "      <td>54.3</td>\n",
       "      <td>33.1</td>\n",
       "      <td>29.0</td>\n",
       "      <td>85.1</td>\n",
       "      <td>82.4</td>\n",
       "      <td>50.7</td>\n",
       "      <td>35.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>92.9</td>\n",
       "      <td>81.3</td>\n",
       "      <td>77.0</td>\n",
       "      <td>66.7</td>\n",
       "      <td>31.0</td>\n",
       "      <td>84.8</td>\n",
       "      <td>81.8</td>\n",
       "      <td>70.4</td>\n",
       "      <td>45.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">MinTL</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>92.3</td>\n",
       "      <td>47.4</td>\n",
       "      <td>29.8</td>\n",
       "      <td>12.9</td>\n",
       "      <td>4.5</td>\n",
       "      <td>83.0</td>\n",
       "      <td>52.7</td>\n",
       "      <td>37.2</td>\n",
       "      <td>3.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.5</td>\n",
       "      <td>64.3</td>\n",
       "      <td>56.2</td>\n",
       "      <td>37.0</td>\n",
       "      <td>5.6</td>\n",
       "      <td>83.9</td>\n",
       "      <td>59.3</td>\n",
       "      <td>44.4</td>\n",
       "      <td>4.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>92.8</td>\n",
       "      <td>70.0</td>\n",
       "      <td>67.8</td>\n",
       "      <td>54.3</td>\n",
       "      <td>7.1</td>\n",
       "      <td>84.2</td>\n",
       "      <td>81.5</td>\n",
       "      <td>64.0</td>\n",
       "      <td>30.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.4</td>\n",
       "      <td>74.4</td>\n",
       "      <td>72.2</td>\n",
       "      <td>58.3</td>\n",
       "      <td>7.6</td>\n",
       "      <td>84.4</td>\n",
       "      <td>82.0</td>\n",
       "      <td>65.1</td>\n",
       "      <td>35.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>91.7</td>\n",
       "      <td>70.2</td>\n",
       "      <td>64.0</td>\n",
       "      <td>54.5</td>\n",
       "      <td>22.9</td>\n",
       "      <td>83.5</td>\n",
       "      <td>80.0</td>\n",
       "      <td>66.3</td>\n",
       "      <td>42.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>92.9</td>\n",
       "      <td>78.0</td>\n",
       "      <td>73.4</td>\n",
       "      <td>62.9</td>\n",
       "      <td>26.7</td>\n",
       "      <td>83.6</td>\n",
       "      <td>80.4</td>\n",
       "      <td>66.3</td>\n",
       "      <td>46.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">SDPDST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>93.6</td>\n",
       "      <td>59.0</td>\n",
       "      <td>44.7</td>\n",
       "      <td>47.7</td>\n",
       "      <td>6.7</td>\n",
       "      <td>86.2</td>\n",
       "      <td>58.0</td>\n",
       "      <td>39.8</td>\n",
       "      <td>7.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>94.7</td>\n",
       "      <td>74.7</td>\n",
       "      <td>66.2</td>\n",
       "      <td>54.6</td>\n",
       "      <td>17.4</td>\n",
       "      <td>86.2</td>\n",
       "      <td>66.9</td>\n",
       "      <td>54.0</td>\n",
       "      <td>23.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>93.3</td>\n",
       "      <td>81.9</td>\n",
       "      <td>79.5</td>\n",
       "      <td>66.6</td>\n",
       "      <td>7.8</td>\n",
       "      <td>87.2</td>\n",
       "      <td>84.9</td>\n",
       "      <td>68.5</td>\n",
       "      <td>34.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>95.0</td>\n",
       "      <td>78.3</td>\n",
       "      <td>77.5</td>\n",
       "      <td>58.7</td>\n",
       "      <td>9.9</td>\n",
       "      <td>86.6</td>\n",
       "      <td>84.3</td>\n",
       "      <td>68.1</td>\n",
       "      <td>36.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>92.6</td>\n",
       "      <td>83.4</td>\n",
       "      <td>80.1</td>\n",
       "      <td>74.6</td>\n",
       "      <td>24.1</td>\n",
       "      <td>86.9</td>\n",
       "      <td>83.8</td>\n",
       "      <td>72.4</td>\n",
       "      <td>42.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>94.6</td>\n",
       "      <td>82.5</td>\n",
       "      <td>78.8</td>\n",
       "      <td>65.8</td>\n",
       "      <td>25.8</td>\n",
       "      <td>85.9</td>\n",
       "      <td>82.3</td>\n",
       "      <td>70.3</td>\n",
       "      <td>44.3</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                          sgd/group0                                      \\\n",
       "                                 RSA                                CDTA   \n",
       "                            domain_1 domain_2 domain_3 domain_4 domain_1   \n",
       "T5DST  Single           0       94.1     44.9     23.5     13.2      4.9   \n",
       "                        4       93.8     71.8     59.5     48.4     15.8   \n",
       "       Single+Concat    0       94.0     78.1     53.5     32.9      5.5   \n",
       "                        4       93.9     76.9     74.7     50.9      8.8   \n",
       "       Single+ConcatRel 0       94.0     81.8     54.3     33.1     29.0   \n",
       "                        4       92.9     81.3     77.0     66.7     31.0   \n",
       "MinTL  Single           0       92.3     47.4     29.8     12.9      4.5   \n",
       "                        4       93.5     64.3     56.2     37.0      5.6   \n",
       "       Single+Concat    0       92.8     70.0     67.8     54.3      7.1   \n",
       "                        4       93.4     74.4     72.2     58.3      7.6   \n",
       "       Single+ConcatRel 0       91.7     70.2     64.0     54.5     22.9   \n",
       "                        4       92.9     78.0     73.4     62.9     26.7   \n",
       "SDPDST Single           0       93.6     59.0     44.7     47.7      6.7   \n",
       "                        4       94.7     74.7     66.2     54.6     17.4   \n",
       "       Single+Concat    0       93.3     81.9     79.5     66.6      7.8   \n",
       "                        4       95.0     78.3     77.5     58.7      9.9   \n",
       "       Single+ConcatRel 0       92.6     83.4     80.1     74.6     24.1   \n",
       "                        4       94.6     82.5     78.8     65.8     25.8   \n",
       "\n",
       "                          multiwoz21                             \n",
       "                                 RSA                       CDTA  \n",
       "                            domain_1 domain_2 domain_3 domain_1  \n",
       "T5DST  Single           0       85.9     44.4     22.1      4.1  \n",
       "                        4       85.1     65.2     54.1     18.4  \n",
       "       Single+Concat    0       85.3     83.9     44.9     32.4  \n",
       "                        4       85.3     83.6     68.4     37.3  \n",
       "       Single+ConcatRel 0       85.1     82.4     50.7     35.4  \n",
       "                        4       84.8     81.8     70.4     45.5  \n",
       "MinTL  Single           0       83.0     52.7     37.2      3.2  \n",
       "                        4       83.9     59.3     44.4      4.7  \n",
       "       Single+Concat    0       84.2     81.5     64.0     30.9  \n",
       "                        4       84.4     82.0     65.1     35.6  \n",
       "       Single+ConcatRel 0       83.5     80.0     66.3     42.0  \n",
       "                        4       83.6     80.4     66.3     46.4  \n",
       "SDPDST Single           0       86.2     58.0     39.8      7.6  \n",
       "                        4       86.2     66.9     54.0     23.0  \n",
       "       Single+Concat    0       87.2     84.9     68.5     34.7  \n",
       "                        4       86.6     84.3     68.1     36.2  \n",
       "       Single+ConcatRel 0       86.9     83.8     72.4     42.5  \n",
       "                        4       85.9     82.3     70.3     44.3  "
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the main results table; snapshot tagged 0617, taken after the\n",
    "# empty-value bug fix mentioned in the tag below.\n",
    "main_exp_table #0617 fix empty value bug"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 73,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"5\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>domain_1</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">MinTL</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>93.5</td>\n",
       "      <td>49.3</td>\n",
       "      <td>30.5</td>\n",
       "      <td>26.9</td>\n",
       "      <td>4.0</td>\n",
       "      <td>83.2</td>\n",
       "      <td>52.4</td>\n",
       "      <td>38.2</td>\n",
       "      <td>28.3</td>\n",
       "      <td>2.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.3</td>\n",
       "      <td>63.0</td>\n",
       "      <td>53.4</td>\n",
       "      <td>27.8</td>\n",
       "      <td>5.1</td>\n",
       "      <td>84.7</td>\n",
       "      <td>58.2</td>\n",
       "      <td>42.5</td>\n",
       "      <td>38.3</td>\n",
       "      <td>3.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>93.1</td>\n",
       "      <td>69.6</td>\n",
       "      <td>66.2</td>\n",
       "      <td>53.6</td>\n",
       "      <td>7.5</td>\n",
       "      <td>84.6</td>\n",
       "      <td>82.0</td>\n",
       "      <td>64.6</td>\n",
       "      <td>74.3</td>\n",
       "      <td>32.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.2</td>\n",
       "      <td>74.1</td>\n",
       "      <td>72.4</td>\n",
       "      <td>58.1</td>\n",
       "      <td>7.3</td>\n",
       "      <td>84.4</td>\n",
       "      <td>82.3</td>\n",
       "      <td>66.0</td>\n",
       "      <td>83.0</td>\n",
       "      <td>36.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>92.5</td>\n",
       "      <td>69.8</td>\n",
       "      <td>64.2</td>\n",
       "      <td>52.5</td>\n",
       "      <td>19.2</td>\n",
       "      <td>83.5</td>\n",
       "      <td>80.2</td>\n",
       "      <td>66.2</td>\n",
       "      <td>63.6</td>\n",
       "      <td>43.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>92.8</td>\n",
       "      <td>78.3</td>\n",
       "      <td>73.6</td>\n",
       "      <td>61.2</td>\n",
       "      <td>26.5</td>\n",
       "      <td>83.9</td>\n",
       "      <td>80.3</td>\n",
       "      <td>67.1</td>\n",
       "      <td>74.4</td>\n",
       "      <td>45.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">T5DST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>94.1</td>\n",
       "      <td>44.9</td>\n",
       "      <td>23.5</td>\n",
       "      <td>13.2</td>\n",
       "      <td>4.9</td>\n",
       "      <td>85.9</td>\n",
       "      <td>44.4</td>\n",
       "      <td>22.1</td>\n",
       "      <td>15.7</td>\n",
       "      <td>4.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.8</td>\n",
       "      <td>71.8</td>\n",
       "      <td>59.5</td>\n",
       "      <td>48.4</td>\n",
       "      <td>15.8</td>\n",
       "      <td>85.1</td>\n",
       "      <td>65.2</td>\n",
       "      <td>54.1</td>\n",
       "      <td>51.9</td>\n",
       "      <td>18.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>94.0</td>\n",
       "      <td>78.1</td>\n",
       "      <td>53.5</td>\n",
       "      <td>32.9</td>\n",
       "      <td>5.5</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.9</td>\n",
       "      <td>44.9</td>\n",
       "      <td>38.5</td>\n",
       "      <td>32.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>93.9</td>\n",
       "      <td>76.9</td>\n",
       "      <td>74.7</td>\n",
       "      <td>50.9</td>\n",
       "      <td>8.8</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.6</td>\n",
       "      <td>68.4</td>\n",
       "      <td>77.6</td>\n",
       "      <td>37.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>94.0</td>\n",
       "      <td>81.8</td>\n",
       "      <td>54.3</td>\n",
       "      <td>33.1</td>\n",
       "      <td>29.0</td>\n",
       "      <td>85.1</td>\n",
       "      <td>82.4</td>\n",
       "      <td>50.7</td>\n",
       "      <td>29.3</td>\n",
       "      <td>35.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>92.9</td>\n",
       "      <td>81.3</td>\n",
       "      <td>77.0</td>\n",
       "      <td>66.7</td>\n",
       "      <td>31.0</td>\n",
       "      <td>84.8</td>\n",
       "      <td>81.8</td>\n",
       "      <td>70.4</td>\n",
       "      <td>81.4</td>\n",
       "      <td>45.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">SDPDST</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single</th>\n",
       "      <th>0</th>\n",
       "      <td>93.6</td>\n",
       "      <td>59.0</td>\n",
       "      <td>44.7</td>\n",
       "      <td>47.7</td>\n",
       "      <td>6.7</td>\n",
       "      <td>86.2</td>\n",
       "      <td>58.0</td>\n",
       "      <td>39.8</td>\n",
       "      <td>25.6</td>\n",
       "      <td>7.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>94.7</td>\n",
       "      <td>74.7</td>\n",
       "      <td>66.2</td>\n",
       "      <td>54.6</td>\n",
       "      <td>17.4</td>\n",
       "      <td>86.2</td>\n",
       "      <td>66.9</td>\n",
       "      <td>54.0</td>\n",
       "      <td>61.9</td>\n",
       "      <td>23.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+Concat</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>87.2</td>\n",
       "      <td>84.9</td>\n",
       "      <td>68.5</td>\n",
       "      <td>74.0</td>\n",
       "      <td>34.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>95.0</td>\n",
       "      <td>78.3</td>\n",
       "      <td>77.5</td>\n",
       "      <td>58.7</td>\n",
       "      <td>9.9</td>\n",
       "      <td>86.6</td>\n",
       "      <td>84.3</td>\n",
       "      <td>68.1</td>\n",
       "      <td>83.0</td>\n",
       "      <td>36.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Single+ConcatRel</th>\n",
       "      <th>0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>87.3</td>\n",
       "      <td>83.5</td>\n",
       "      <td>70.7</td>\n",
       "      <td>73.6</td>\n",
       "      <td>41.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>94.3</td>\n",
       "      <td>81.9</td>\n",
       "      <td>79.3</td>\n",
       "      <td>69.5</td>\n",
       "      <td>25.4</td>\n",
       "      <td>86.2</td>\n",
       "      <td>82.4</td>\n",
       "      <td>67.7</td>\n",
       "      <td>74.7</td>\n",
       "      <td>43.9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                          sgd/group0                                      \\\n",
       "                                 RSA                                CDTA   \n",
       "                            domain_1 domain_2 domain_3 domain_4 domain_1   \n",
       "MinTL  Single           0       93.5     49.3     30.5     26.9      4.0   \n",
       "                        4       93.3     63.0     53.4     27.8      5.1   \n",
       "       Single+Concat    0       93.1     69.6     66.2     53.6      7.5   \n",
       "                        4       93.2     74.1     72.4     58.1      7.3   \n",
       "       Single+ConcatRel 0       92.5     69.8     64.2     52.5     19.2   \n",
       "                        4       92.8     78.3     73.6     61.2     26.5   \n",
       "T5DST  Single           0       94.1     44.9     23.5     13.2      4.9   \n",
       "                        4       93.8     71.8     59.5     48.4     15.8   \n",
       "       Single+Concat    0       94.0     78.1     53.5     32.9      5.5   \n",
       "                        4       93.9     76.9     74.7     50.9      8.8   \n",
       "       Single+ConcatRel 0       94.0     81.8     54.3     33.1     29.0   \n",
       "                        4       92.9     81.3     77.0     66.7     31.0   \n",
       "SDPDST Single           0       93.6     59.0     44.7     47.7      6.7   \n",
       "                        4       94.7     74.7     66.2     54.6     17.4   \n",
       "       Single+Concat    0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4       95.0     78.3     77.5     58.7      9.9   \n",
       "       Single+ConcatRel 0        NaN      NaN      NaN      NaN      NaN   \n",
       "                        4       94.3     81.9     79.3     69.5     25.4   \n",
       "\n",
       "                          multiwoz21                                      \n",
       "                                 RSA                                CDTA  \n",
       "                            domain_1 domain_2 domain_3 domain_4 domain_1  \n",
       "MinTL  Single           0       83.2     52.4     38.2     28.3      2.5  \n",
       "                        4       84.7     58.2     42.5     38.3      3.3  \n",
       "       Single+Concat    0       84.6     82.0     64.6     74.3     32.7  \n",
       "                        4       84.4     82.3     66.0     83.0     36.3  \n",
       "       Single+ConcatRel 0       83.5     80.2     66.2     63.6     43.7  \n",
       "                        4       83.9     80.3     67.1     74.4     45.2  \n",
       "T5DST  Single           0       85.9     44.4     22.1     15.7      4.1  \n",
       "                        4       85.1     65.2     54.1     51.9     18.4  \n",
       "       Single+Concat    0       85.3     83.9     44.9     38.5     32.4  \n",
       "                        4       85.3     83.6     68.4     77.6     37.3  \n",
       "       Single+ConcatRel 0       85.1     82.4     50.7     29.3     35.4  \n",
       "                        4       84.8     81.8     70.4     81.4     45.5  \n",
       "SDPDST Single           0       86.2     58.0     39.8     25.6      7.6  \n",
       "                        4       86.2     66.9     54.0     61.9     23.0  \n",
       "       Single+Concat    0       87.2     84.9     68.5     74.0     34.7  \n",
       "                        4       86.6     84.3     68.1     83.0     36.2  \n",
       "       Single+ConcatRel 0       87.3     83.5     70.7     73.6     41.7  \n",
       "                        4       86.2     82.4     67.7     74.7     43.9  "
      ]
     },
     "execution_count": 73,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the main results table; snapshot tagged 0615.\n",
    "# The stored output of this run still contains all-NaN rows for\n",
    "# SDPDST on sgd/group0 (Single+Concat and Single+ConcatRel, index 0).\n",
    "main_exp_table #0615"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lllrrrrrrrrr}\n",
      "\\toprule\n",
      "       &                  &   & \\multicolumn{5}{l}{sgd/group0} & \\multicolumn{4}{l}{multiwoz21} \\\\\n",
      "       &                  &   & \\multicolumn{4}{l}{RSA} &     CDTA & \\multicolumn{3}{l}{RSA} &     CDTA \\\\\n",
      "       &                  &   &   domain\\_1 & domain\\_2 & domain\\_3 & domain\\_4 & domain\\_1 &   domain\\_1 & domain\\_2 & domain\\_3 & domain\\_1 \\\\\n",
      "\\midrule\n",
      "T5DST & Single & 0 &       94.1 &     44.9 &     23.5 &     13.2 &      2.7 &       85.9 &     44.4 &     22.1 &      1.6 \\\\\n",
      "       &                  & 4 &       93.8 &     71.8 &     59.5 &     48.4 &     11.8 &       85.1 &     65.2 &     54.1 &      6.6 \\\\\n",
      "       & Single+Concat & 0 &       94.0 &     78.1 &     53.5 &     32.9 &      1.6 &       85.3 &     83.9 &     44.9 &     11.2 \\\\\n",
      "       &                  & 4 &       93.9 &     76.9 &     74.7 &     50.9 &      1.8 &       85.3 &     83.6 &     68.4 &     11.1 \\\\\n",
      "       & Single+ConcatRel & 0 &       94.0 &     81.8 &     54.3 &     33.1 &     25.8 &       85.1 &     82.4 &     50.7 &     20.9 \\\\\n",
      "       &                  & 4 &       92.9 &     81.3 &     77.0 &     66.7 &     26.9 &       84.8 &     81.8 &     70.4 &     30.8 \\\\\n",
      "MinTL & Single & 0 &       92.3 &     47.4 &     29.8 &     12.9 &      2.1 &       83.0 &     52.7 &     37.2 &      1.8 \\\\\n",
      "       &                  & 4 &       93.5 &     64.3 &     56.2 &     37.0 &      0.8 &       83.9 &     59.3 &     44.4 &      1.9 \\\\\n",
      "       & Single+Concat & 0 &       92.8 &     70.0 &     67.8 &     54.3 &      1.1 &       84.2 &     81.5 &     64.0 &      5.8 \\\\\n",
      "       &                  & 4 &       93.4 &     74.4 &     72.2 &     58.3 &      0.5 &       84.4 &     82.0 &     65.1 &      7.3 \\\\\n",
      "       & Single+ConcatRel & 0 &       91.7 &     70.2 &     64.0 &     54.5 &     18.2 &       83.5 &     80.0 &     66.3 &     27.5 \\\\\n",
      "       &                  & 4 &       92.9 &     78.0 &     73.4 &     62.9 &     21.8 &       83.6 &     80.4 &     66.3 &     29.1 \\\\\n",
      "SDPDST & Single & 0 &       93.6 &     59.0 &     44.7 &     47.7 &      3.8 &       86.2 &     58.0 &     39.8 &      1.4 \\\\\n",
      "       &                  & 4 &       94.7 &     74.7 &     66.2 &     54.6 &     13.2 &       86.2 &     66.9 &     54.0 &      8.5 \\\\\n",
      "       & Single+Concat & 0 &       93.3 &     81.9 &     79.5 &     66.6 &      0.8 &       87.2 &     84.9 &     68.5 &      9.1 \\\\\n",
      "       &                  & 4 &       95.0 &     78.3 &     77.5 &     58.7 &      1.7 &       86.6 &     84.3 &     68.1 &      8.3 \\\\\n",
      "       & Single+ConcatRel & 0 &       92.6 &     83.4 &     80.1 &     74.6 &     18.1 &       86.9 &     83.8 &     72.4 &     26.8 \\\\\n",
      "       &                  & 4 &       96.0 &     85.8 &     81.2 &     68.8 &     22.3 &       87.3 &     83.5 &     71.3 &     26.3 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_50930/1754652341.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(main_exp_table.to_latex())\n"
     ]
    }
   ],
   "source": [
    "# Print the main results table as LaTeX source.\n",
    "# NOTE: the pandas version used for this run emits a FutureWarning for\n",
    "# DataFrame.to_latex and recommends DataFrame.style.to_latex instead; the\n",
    "# rendered format may change after a pandas upgrade.\n",
    "print(main_exp_table.to_latex())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Domain expansion"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">0</th>\n",
       "      <th>10SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">4</th>\n",
       "      <th>10SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          RSA                   CDTA                 \n",
       "        sgd10 sgd15 sgd19  all sgd10 sgd15 sgd19  all\n",
       "0 10SYN   NaN   NaN   NaN  NaN   NaN   NaN   NaN  NaN\n",
       "  15SYN   NaN   NaN   NaN  NaN   NaN   NaN   NaN  NaN\n",
       "  SYN     NaN   NaN   NaN  NaN   NaN   NaN   NaN  NaN\n",
       "4 10SYN   NaN   NaN   NaN  NaN   NaN   NaN   NaN  NaN\n",
       "  15SYN   NaN   NaN   NaN  NaN   NaN   NaN   NaN  NaN\n",
       "  SYN     NaN   NaN   NaN  NaN   NaN   NaN   NaN  NaN"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Domain-expansion table: rows = (0 or 4) x training setting, columns = metric x test group.\n",
    "# NOTE: this cell rebinds the notebook-wide `aug_types`, `index_names`, `datasets` and `models`.\n",
    "# aug_types[i] = (aug_type, aug_times) is the run configuration labelled index_names[i];\n",
    "# both lists are cut to their first three entries, so only the *SYN settings are tabulated.\n",
    "aug_types = [(18, 2.0), (19, 2.0), (5, 2.0), (14, 2.0), (15, 2.0), (1, 0.1)][:3]\n",
    "index_names = ['10SYN', '15SYN', 'SYN', '10TRUE', '15TRUE', '19TRUE'][:3]\n",
    "datasets = ['sgd/group0']\n",
    "models = ['T5DST']\n",
    "# No data is passed, so every cell starts out as NaN.\n",
    "domain_expand_table = pd.DataFrame(\n",
    "    index=pd.MultiIndex.from_product([[0, 4], index_names]),\n",
    "    columns=pd.MultiIndex.from_product([['RSA', 'CDTA'], ['sgd10', 'sgd15', 'sgd19', 'all']]),\n",
    ")\n",
    "domain_expand_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Fill `domain_expand_table` with the RSA / CDTA scores stored in each run's markdown result table.\n",
    "# NOTE: the table has no dataset level, so with several `datasets` later ones overwrite earlier ones.\n",
    "table = domain_expand_table\n",
    "for i, (aug_type, aug_times) in enumerate(aug_types):\n",
    "    index_name = index_names[i]\n",
    "    for j, model_name in zip([0,1,3], models):\n",
    "        # For each id j the runs `model{j}` and `model{j+4}` are read; k - j (0 or 4) is the row group.\n",
    "        for k in [j, j+4]:\n",
    "            c = 4 if k == 1 else 100  # value substituted into the `context{c}` part of the run directory\n",
    "            for dataset in datasets:\n",
    "                res_dir = f'output0615/{dataset}/qadst_f1_th>0.1/t5-large_aug{aug_type}_x{aug_times}_model{k}_context{c}'\n",
    "                res_file = f'{res_dir}/test_multi_domain_result_ori_cdta.md'\n",
    "                if not os.path.exists(res_file):\n",
    "                    # Name the missing run so that a NaN row in the table can be traced back to its file.\n",
    "                    print(res_file)\n",
    "                    continue\n",
    "                # The result file is a pipe-delimited markdown table: drop columns that are entirely empty\n",
    "                # and the first row (presumably the |---| separator -- TODO confirm), then strip the\n",
    "                # padding around every cell, column name and row label.\n",
    "                df = pd.read_table(res_file, sep='|', index_col=1).dropna(axis=1, how='all').iloc[1:]\n",
    "                df = df.apply(lambda x: x.str.strip())\n",
    "                df = df.rename(columns=str.strip).rename(index=str.strip)\n",
    "\n",
    "                for group in ['sgd10', 'sgd15', 'sgd19', 'all']:\n",
    "                    table.loc[(k-j, index_name), ('RSA', group)] = df.loc[group, 'RSA']\n",
    "                    table.loc[(k-j, index_name), ('CDTA', group)] = df.loc[group, 'CDTA']\n",
    "\n",
    "# Turn the string cells into percentages rounded to one decimal; unparsable or unfilled cells become NaN.\n",
    "domain_expand_table = domain_expand_table.applymap(lambda x: round(pd.to_numeric(x, errors='coerce') * 100, 1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">0</th>\n",
       "      <th>10SYN</th>\n",
       "      <td>83.4</td>\n",
       "      <td>80.4</td>\n",
       "      <td>74.7</td>\n",
       "      <td>77.7</td>\n",
       "      <td>30.6</td>\n",
       "      <td>17.0</td>\n",
       "      <td>14.5</td>\n",
       "      <td>17.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15SYN</th>\n",
       "      <td>83.1</td>\n",
       "      <td>85.1</td>\n",
       "      <td>76.3</td>\n",
       "      <td>79.9</td>\n",
       "      <td>44.2</td>\n",
       "      <td>23.9</td>\n",
       "      <td>19.9</td>\n",
       "      <td>24.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SYN</th>\n",
       "      <td>81.3</td>\n",
       "      <td>84.8</td>\n",
       "      <td>81.6</td>\n",
       "      <td>82.5</td>\n",
       "      <td>33.5</td>\n",
       "      <td>27.2</td>\n",
       "      <td>23.6</td>\n",
       "      <td>25.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">4</th>\n",
       "      <th>10SYN</th>\n",
       "      <td>87.0</td>\n",
       "      <td>84.1</td>\n",
       "      <td>82.1</td>\n",
       "      <td>83.5</td>\n",
       "      <td>38.0</td>\n",
       "      <td>27.7</td>\n",
       "      <td>21.0</td>\n",
       "      <td>24.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15SYN</th>\n",
       "      <td>85.3</td>\n",
       "      <td>85.5</td>\n",
       "      <td>83.0</td>\n",
       "      <td>84.1</td>\n",
       "      <td>32.2</td>\n",
       "      <td>27.4</td>\n",
       "      <td>20.4</td>\n",
       "      <td>23.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SYN</th>\n",
       "      <td>87.5</td>\n",
       "      <td>85.6</td>\n",
       "      <td>83.7</td>\n",
       "      <td>84.8</td>\n",
       "      <td>38.4</td>\n",
       "      <td>27.2</td>\n",
       "      <td>24.3</td>\n",
       "      <td>26.9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          RSA                    CDTA                  \n",
       "        sgd10 sgd15 sgd19   all sgd10 sgd15 sgd19   all\n",
       "0 10SYN  83.4  80.4  74.7  77.7  30.6  17.0  14.5  17.2\n",
       "  15SYN  83.1  85.1  76.3  79.9  44.2  23.9  19.9  24.1\n",
       "  SYN    81.3  84.8  81.6  82.5  33.5  27.2  23.6  25.8\n",
       "4 10SYN  87.0  84.1  82.1  83.5  38.0  27.7  21.0  24.8\n",
       "  15SYN  85.3  85.5  83.0  84.1  32.2  27.4  20.4  23.7\n",
       "  SYN    87.5  85.6  83.7  84.8  38.4  27.2  24.3  26.9"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "domain_expand_table # 0620"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 126,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">0</th>\n",
       "      <th>10SYN</th>\n",
       "      <td>83.4</td>\n",
       "      <td>80.4</td>\n",
       "      <td>74.7</td>\n",
       "      <td>77.7</td>\n",
       "      <td>29.4</td>\n",
       "      <td>21.0</td>\n",
       "      <td>16.6</td>\n",
       "      <td>19.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15SYN</th>\n",
       "      <td>83.1</td>\n",
       "      <td>85.1</td>\n",
       "      <td>76.3</td>\n",
       "      <td>79.9</td>\n",
       "      <td>39.2</td>\n",
       "      <td>30.2</td>\n",
       "      <td>22.0</td>\n",
       "      <td>26.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SYN</th>\n",
       "      <td>81.3</td>\n",
       "      <td>84.8</td>\n",
       "      <td>81.6</td>\n",
       "      <td>82.5</td>\n",
       "      <td>32.0</td>\n",
       "      <td>34.9</td>\n",
       "      <td>26.5</td>\n",
       "      <td>29.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">4</th>\n",
       "      <th>10SYN</th>\n",
       "      <td>87.0</td>\n",
       "      <td>84.1</td>\n",
       "      <td>82.1</td>\n",
       "      <td>83.5</td>\n",
       "      <td>41.2</td>\n",
       "      <td>35.1</td>\n",
       "      <td>24.5</td>\n",
       "      <td>29.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15SYN</th>\n",
       "      <td>85.3</td>\n",
       "      <td>85.5</td>\n",
       "      <td>83.0</td>\n",
       "      <td>84.1</td>\n",
       "      <td>37.8</td>\n",
       "      <td>35.6</td>\n",
       "      <td>24.1</td>\n",
       "      <td>28.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>SYN</th>\n",
       "      <td>87.5</td>\n",
       "      <td>85.6</td>\n",
       "      <td>83.7</td>\n",
       "      <td>84.8</td>\n",
       "      <td>42.4</td>\n",
       "      <td>34.6</td>\n",
       "      <td>27.0</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          RSA                    CDTA                  \n",
       "        sgd10 sgd15 sgd19   all sgd10 sgd15 sgd19   all\n",
       "0 10SYN  83.4  80.4  74.7  77.7  29.4  21.0  16.6  19.6\n",
       "  15SYN  83.1  85.1  76.3  79.9  39.2  30.2  22.0  26.4\n",
       "  SYN    81.3  84.8  81.6  82.5  32.0  34.9  26.5  29.0\n",
       "4 10SYN  87.0  84.1  82.1  83.5  41.2  35.1  24.5  29.3\n",
       "  15SYN  85.3  85.5  83.0  84.1  37.8  35.6  24.1  28.6\n",
       "  SYN    87.5  85.6  83.7  84.8  42.4  34.6  27.0  31.0"
      ]
     },
     "execution_count": 126,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# domain_expand_table = domain_expand_table.drop(columns=['CDTA'])\n",
    "domain_expand_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "      <th>sgd10</th>\n",
       "      <th>sgd15</th>\n",
       "      <th>sgd19</th>\n",
       "      <th>all</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"4\" valign=\"top\">0</th>\n",
       "      <th>SYN</th>\n",
       "      <td>81.3</td>\n",
       "      <td>84.8</td>\n",
       "      <td>81.6</td>\n",
       "      <td>82.5</td>\n",
       "      <td>32.0</td>\n",
       "      <td>34.9</td>\n",
       "      <td>26.5</td>\n",
       "      <td>29.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10TURE</th>\n",
       "      <td>92.3</td>\n",
       "      <td>68.1</td>\n",
       "      <td>60.9</td>\n",
       "      <td>68.0</td>\n",
       "      <td>70.0</td>\n",
       "      <td>7.8</td>\n",
       "      <td>3.8</td>\n",
       "      <td>15.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15TRUE</th>\n",
       "      <td>89.5</td>\n",
       "      <td>87.9</td>\n",
       "      <td>69.8</td>\n",
       "      <td>78.2</td>\n",
       "      <td>57.1</td>\n",
       "      <td>50.7</td>\n",
       "      <td>9.4</td>\n",
       "      <td>25.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19TRUE</th>\n",
       "      <td>82.5</td>\n",
       "      <td>87.4</td>\n",
       "      <td>87.0</td>\n",
       "      <td>86.4</td>\n",
       "      <td>62.8</td>\n",
       "      <td>57.6</td>\n",
       "      <td>45.9</td>\n",
       "      <td>50.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"4\" valign=\"top\">4</th>\n",
       "      <th>SYN</th>\n",
       "      <td>87.5</td>\n",
       "      <td>85.6</td>\n",
       "      <td>83.7</td>\n",
       "      <td>84.8</td>\n",
       "      <td>42.4</td>\n",
       "      <td>34.6</td>\n",
       "      <td>27.0</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10TURE</th>\n",
       "      <td>92.3</td>\n",
       "      <td>85.5</td>\n",
       "      <td>85.1</td>\n",
       "      <td>86.4</td>\n",
       "      <td>78.4</td>\n",
       "      <td>28.0</td>\n",
       "      <td>25.3</td>\n",
       "      <td>34.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15TRUE</th>\n",
       "      <td>88.6</td>\n",
       "      <td>88.3</td>\n",
       "      <td>84.6</td>\n",
       "      <td>86.3</td>\n",
       "      <td>62.2</td>\n",
       "      <td>54.4</td>\n",
       "      <td>28.0</td>\n",
       "      <td>38.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19TRUE</th>\n",
       "      <td>86.0</td>\n",
       "      <td>86.4</td>\n",
       "      <td>87.0</td>\n",
       "      <td>86.7</td>\n",
       "      <td>45.2</td>\n",
       "      <td>50.5</td>\n",
       "      <td>40.0</td>\n",
       "      <td>42.9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "           RSA                    CDTA                  \n",
       "         sgd10 sgd15 sgd19   all sgd10 sgd15 sgd19   all\n",
       "0 SYN     81.3  84.8  81.6  82.5  32.0  34.9  26.5  29.0\n",
       "  10TURE  92.3  68.1  60.9  68.0  70.0   7.8   3.8  15.5\n",
       "  15TRUE  89.5  87.9  69.8  78.2  57.1  50.7   9.4  25.3\n",
       "  19TRUE  82.5  87.4  87.0  86.4  62.8  57.6  45.9  50.9\n",
       "4 SYN     87.5  85.6  83.7  84.8  42.4  34.6  27.0  31.0\n",
       "  10TURE  92.3  85.5  85.1  86.4  78.4  28.0  25.3  34.5\n",
       "  15TRUE  88.6  88.3  84.6  86.3  62.2  54.4  28.0  38.8\n",
       "  19TRUE  86.0  86.4  87.0  86.7  45.2  50.5  40.0  42.9"
      ]
     },
     "execution_count": 123,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "domain_expand_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{llrrrrrrrr}\n",
      "\\toprule\n",
      "  &     & \\multicolumn{4}{l}{RSA} & \\multicolumn{4}{l}{CDTA} \\\\\n",
      "  &     & sgd10 & sgd15 & sgd19 &   all & sgd10 & sgd15 & sgd19 &   all \\\\\n",
      "\\midrule\n",
      "0 & 10SYN &  83.4 &  80.4 &  74.7 &  77.7 &  30.6 &  17.0 &  14.5 &  17.2 \\\\\n",
      "  & 15SYN &  83.1 &  85.1 &  76.3 &  79.9 &  44.2 &  23.9 &  19.9 &  24.1 \\\\\n",
      "  & SYN &  81.3 &  84.8 &  81.6 &  82.5 &  33.5 &  27.2 &  23.6 &  25.8 \\\\\n",
      "4 & 10SYN &  87.0 &  84.1 &  82.1 &  83.5 &  38.0 &  27.7 &  21.0 &  24.8 \\\\\n",
      "  & 15SYN &  85.3 &  85.5 &  83.0 &  84.1 &  32.2 &  27.4 &  20.4 &  23.7 \\\\\n",
      "  & SYN &  87.5 &  85.6 &  83.7 &  84.8 &  38.4 &  27.2 &  24.3 &  26.9 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_50930/705736087.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(domain_expand_table.to_latex())\n"
     ]
    }
   ],
   "source": [
    "print(domain_expand_table.to_latex())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### CoQR"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"3\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"3\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>JGA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>JGA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-ChatGPT</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0           multiwoz21          \n",
       "                        JGA  RSA CDTA        JGA  RSA CDTA\n",
       "\\singleConcat           NaN  NaN  NaN        NaN  NaN  NaN\n",
       "CoQR-Zero               NaN  NaN  NaN        NaN  NaN  NaN\n",
       "CoQR-ChatGPT            NaN  NaN  NaN        NaN  NaN  NaN\n",
       "CoQR-SYN                NaN  NaN  NaN        NaN  NaN  NaN\n",
       "\\singleConcatRel        NaN  NaN  NaN        NaN  NaN  NaN\n",
       "\\singleSYN              NaN  NaN  NaN        NaN  NaN  NaN\n",
       "\\singleSYN (1x)         NaN  NaN  NaN        NaN  NaN  NaN\n",
       "\\singleSYN (4x)         NaN  NaN  NaN        NaN  NaN  NaN\n",
       "\\singleSYNN             NaN  NaN  NaN        NaN  NaN  NaN\n",
       "Real                    NaN  NaN  NaN        NaN  NaN  NaN"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# CoQR comparison table: one row per system / training setting, columns = (dataset, metric).\n",
    "# NOTE: this cell rebinds the notebook-wide `aug_types`, `index_names` and `datasets`.\n",
    "# aug_types[i] = (aug_type, aug_times) is the run configuration behind index_names[i].\n",
    "aug_types = [(2, 2.0), (2, 2.0), (2, 2.0), (2, 2.0), (4, 2.0), (5, 2.0), (5, 1.0), (5, 4.0), (11, 2.0), (1, 0.1)]\n",
    "# Labels starting with a backslash (presumably LaTeX macro names -- TODO confirm) are raw strings,\n",
    "# so the backslash stays literal without relying on Python's deprecated unknown-escape handling.\n",
    "index_names = [\n",
    "    r'\\singleConcat', 'CoQR-Zero', 'CoQR-ChatGPT', 'CoQR-SYN', r'\\singleConcatRel',\n",
    "    r'\\singleSYN', r'\\singleSYN (1x)', r'\\singleSYN (4x)', r'\\singleSYNN', 'Real',\n",
    "]\n",
    "datasets = ['sgd/group0', 'multiwoz21']\n",
    "# No data is passed, so every cell starts out as NaN.\n",
    "coqr_test_table = pd.DataFrame(index=index_names,\n",
    "                               columns=pd.MultiIndex.from_product([datasets, ['JGA', 'RSA', 'CDTA']]))\n",
    "coqr_test_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug2_x2.0_model0_context100/test_multi_domain_coqr_canard_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug2_x2.0_model0_context100/test_multi_domain_coqr_canard_result_ori_cdta.md\n",
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug2_x2.0_model0_context100/test_multi_domain_coqr_chatgpt_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug2_x2.0_model0_context100/test_multi_domain_coqr_chatgpt_result_ori_cdta.md\n",
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug2_x2.0_model0_context100/test_multi_domain_coqr_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug2_x2.0_model0_context100/test_multi_domain_coqr_result_ori_cdta.md\n",
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug4_x2.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug4_x2.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug5_x1.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug5_x1.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug5_x4.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug5_x4.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/sgd/group0/qadst_f1_th>0.1/t5-large_aug11_x2.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug11_x2.0_model0_context100/test_multi_domain_result_ori_cdta.md\n",
      "output0615/multiwoz21/qadst_f1_th>0.1/t5-large_aug1_x0.1_model0_context100/test_multi_domain_result_ori_cdta.md\n"
     ]
    }
   ],
   "source": [
    "# Copy the overall ('all') JGA / RSA / CDTA of every available run into the CoQR table.\n",
    "table = coqr_test_table\n",
    "# The three CoQR rows read a dedicated result file; every other row uses the default one.\n",
    "coqr_result_names = {\n",
    "    'CoQR-Zero': 'test_multi_domain_coqr_canard_result_ori_cdta.md',\n",
    "    'CoQR-SYN': 'test_multi_domain_coqr_result_ori_cdta.md',\n",
    "    'CoQR-ChatGPT': 'test_multi_domain_coqr_chatgpt_result_ori_cdta.md',\n",
    "}\n",
    "for i, (aug_type, aug_times) in enumerate(aug_types):\n",
    "    index_name = index_names[i]\n",
    "    res_name = coqr_result_names.get(index_name, 'test_multi_domain_result_ori_cdta.md')\n",
    "    for dataset in datasets:\n",
    "        res_dir = f'output0615/{dataset}/qadst_f1_th>0.1/t5-large_aug{aug_type}_x{aug_times}_model0_context100'\n",
    "        res_file = f'{res_dir}/{res_name}'\n",
    "        if os.path.exists(res_file):\n",
    "            # Parse the pipe-delimited markdown table: drop columns that are entirely empty and the\n",
    "            # first row, then strip the padding around every cell, column name and row label.\n",
    "            df = (\n",
    "                pd.read_table(res_file, sep='|', index_col=1)\n",
    "                .dropna(axis=1, how='all')\n",
    "                .iloc[1:]\n",
    "                .apply(lambda x: x.str.strip())\n",
    "                .rename(columns=str.strip, index=str.strip)\n",
    "            )\n",
    "            for metric in ('RSA', 'CDTA', 'JGA'):\n",
    "                table.loc[index_name, (dataset, metric)] = df.loc['all', metric]\n",
    "        else:\n",
    "            # Runs without a result file keep their NaN row; the path is printed for reference.\n",
    "            print(res_file)\n",
    "\n",
    "# Turn the string cells into percentages rounded to one decimal; unparsable or unfilled cells become NaN.\n",
    "coqr_test_table = coqr_test_table.applymap(\n",
    "    lambda x: round(pd.to_numeric(x, errors='coerce') * 100, 1)\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"3\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"3\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>JGA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>JGA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>45.6</td>\n",
       "      <td>80.5</td>\n",
       "      <td>1.6</td>\n",
       "      <td>43.4</td>\n",
       "      <td>81.6</td>\n",
       "      <td>11.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-ChatGPT</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>50.5</td>\n",
       "      <td>82.5</td>\n",
       "      <td>25.8</td>\n",
       "      <td>40.4</td>\n",
       "      <td>81.2</td>\n",
       "      <td>20.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>58.0</td>\n",
       "      <td>86.4</td>\n",
       "      <td>50.5</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0             multiwoz21            \n",
       "                        JGA   RSA  CDTA        JGA   RSA  CDTA\n",
       "\\singleConcat          45.6  80.5   1.6       43.4  81.6  11.2\n",
       "CoQR-Zero               NaN   NaN   NaN        NaN   NaN   NaN\n",
       "CoQR-ChatGPT            NaN   NaN   NaN        NaN   NaN   NaN\n",
       "CoQR-SYN                NaN   NaN   NaN        NaN   NaN   NaN\n",
       "\\singleConcatRel        NaN   NaN   NaN        NaN   NaN   NaN\n",
       "\\singleSYN             50.5  82.5  25.8       40.4  81.2  20.9\n",
       "\\singleSYN (1x)         NaN   NaN   NaN        NaN   NaN   NaN\n",
       "\\singleSYN (4x)         NaN   NaN   NaN        NaN   NaN   NaN\n",
       "\\singleSYNN             NaN   NaN   NaN        NaN   NaN   NaN\n",
       "Real                   58.0  86.4  50.5        NaN   NaN   NaN"
      ]
     },
     "execution_count": 47,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "coqr_test_table # model0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"2\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>82.5</td>\n",
       "      <td>1.8</td>\n",
       "      <td>83.2</td>\n",
       "      <td>11.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>75.8</td>\n",
       "      <td>16.6</td>\n",
       "      <td>78.9</td>\n",
       "      <td>11.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-ChatGPT</th>\n",
       "      <td>80.5</td>\n",
       "      <td>26.8</td>\n",
       "      <td>81.4</td>\n",
       "      <td>24.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>82.8</td>\n",
       "      <td>4.4</td>\n",
       "      <td>82.7</td>\n",
       "      <td>20.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>84.4</td>\n",
       "      <td>21.1</td>\n",
       "      <td>81.5</td>\n",
       "      <td>27.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>85.0</td>\n",
       "      <td>24.0</td>\n",
       "      <td>81.7</td>\n",
       "      <td>28.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>83.8</td>\n",
       "      <td>26.5</td>\n",
       "      <td>81.2</td>\n",
       "      <td>29.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>85.5</td>\n",
       "      <td>27.4</td>\n",
       "      <td>82.0</td>\n",
       "      <td>30.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>86.7</td>\n",
       "      <td>39.6</td>\n",
       "      <td>83.4</td>\n",
       "      <td>31.4</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0       multiwoz21      \n",
       "                        RSA  CDTA        RSA  CDTA\n",
       "\\singleConcat          82.5   1.8       83.2  11.1\n",
       "CoQR-Zero              75.8  16.6       78.9  11.4\n",
       "CoQR-ChatGPT           80.5  26.8       81.4  24.7\n",
       "CoQR-SYN                NaN   NaN        NaN   NaN\n",
       "\\singleConcatRel       82.8   4.4       82.7  20.2\n",
       "\\singleSYN             84.4  21.1       81.5  27.6\n",
       "\\singleSYN (1x)        85.0  24.0       81.7  28.4\n",
       "\\singleSYN (4x)        83.8  26.5       81.2  29.8\n",
       "\\singleSYNN            85.5  27.4       82.0  30.1\n",
       "Real                   86.7  39.6       83.4  31.4"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "coqr_test_table # model4"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"2\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>84.0</td>\n",
       "      <td>1.7</td>\n",
       "      <td>84.1</td>\n",
       "      <td>8.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>76.5</td>\n",
       "      <td>17.9</td>\n",
       "      <td>79.6</td>\n",
       "      <td>9.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-ChatGPT</th>\n",
       "      <td>81.2</td>\n",
       "      <td>27.3</td>\n",
       "      <td>82.3</td>\n",
       "      <td>24.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>85.6</td>\n",
       "      <td>17.8</td>\n",
       "      <td>83.8</td>\n",
       "      <td>22.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>86.0</td>\n",
       "      <td>19.7</td>\n",
       "      <td>83.2</td>\n",
       "      <td>27.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0       multiwoz21      \n",
       "                        RSA  CDTA        RSA  CDTA\n",
       "\\singleConcat          84.0   1.7       84.1   8.3\n",
       "CoQR-Zero              76.5  17.9       79.6   9.4\n",
       "CoQR-ChatGPT           81.2  27.3       82.3  24.8\n",
       "CoQR-SYN               85.6  17.8       83.8  22.6\n",
       "\\singleConcatRel        NaN   NaN        NaN   NaN\n",
       "\\singleSYN             86.0  19.7       83.2  27.7\n",
       "\\singleSYN (1x)         NaN   NaN        NaN   NaN\n",
       "\\singleSYN (4x)         NaN   NaN        NaN   NaN\n",
       "\\singleSYNN             NaN   NaN        NaN   NaN\n",
       "Real                    NaN   NaN        NaN   NaN"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "coqr_test_table # model7"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"2\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>80.9</td>\n",
       "      <td>0.5</td>\n",
       "      <td>81.8</td>\n",
       "      <td>7.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>73.3</td>\n",
       "      <td>16.0</td>\n",
       "      <td>77.5</td>\n",
       "      <td>8.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-ChatGPT</th>\n",
       "      <td>78.4</td>\n",
       "      <td>25.7</td>\n",
       "      <td>80.0</td>\n",
       "      <td>23.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>82.7</td>\n",
       "      <td>16.9</td>\n",
       "      <td>81.5</td>\n",
       "      <td>21.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>82.7</td>\n",
       "      <td>21.8</td>\n",
       "      <td>80.7</td>\n",
       "      <td>29.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0       multiwoz21      \n",
       "                        RSA  CDTA        RSA  CDTA\n",
       "\\singleConcat          80.9   0.5       81.8   7.3\n",
       "CoQR-Zero              73.3  16.0       77.5   8.1\n",
       "CoQR-ChatGPT           78.4  25.7       80.0  23.0\n",
       "CoQR-SYN               82.7  16.9       81.5  21.6\n",
       "\\singleConcatRel        NaN   NaN        NaN   NaN\n",
       "\\singleSYN             82.7  21.8       80.7  29.1\n",
       "\\singleSYN (1x)         NaN   NaN        NaN   NaN\n",
       "\\singleSYN (4x)         NaN   NaN        NaN   NaN\n",
       "\\singleSYNN             NaN   NaN        NaN   NaN\n",
       "Real                    NaN   NaN        NaN   NaN"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "coqr_test_table # model5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"2\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>82.5</td>\n",
       "      <td>1.8</td>\n",
       "      <td>83.2</td>\n",
       "      <td>11.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>75.8</td>\n",
       "      <td>16.6</td>\n",
       "      <td>78.9</td>\n",
       "      <td>11.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-ChatGPT</th>\n",
       "      <td>80.5</td>\n",
       "      <td>26.8</td>\n",
       "      <td>81.4</td>\n",
       "      <td>24.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>84.1</td>\n",
       "      <td>17.2</td>\n",
       "      <td>83.1</td>\n",
       "      <td>24.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>82.8</td>\n",
       "      <td>4.4</td>\n",
       "      <td>82.7</td>\n",
       "      <td>20.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>84.8</td>\n",
       "      <td>26.9</td>\n",
       "      <td>82.2</td>\n",
       "      <td>30.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>85.0</td>\n",
       "      <td>24.0</td>\n",
       "      <td>81.7</td>\n",
       "      <td>28.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>83.8</td>\n",
       "      <td>26.5</td>\n",
       "      <td>81.2</td>\n",
       "      <td>29.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>85.5</td>\n",
       "      <td>27.4</td>\n",
       "      <td>82.0</td>\n",
       "      <td>30.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>86.7</td>\n",
       "      <td>39.6</td>\n",
       "      <td>83.4</td>\n",
       "      <td>31.4</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0       multiwoz21      \n",
       "                        RSA  CDTA        RSA  CDTA\n",
       "\\singleConcat          82.5   1.8       83.2  11.1\n",
       "CoQR-Zero              75.8  16.6       78.9  11.4\n",
       "CoQR-ChatGPT           80.5  26.8       81.4  24.7\n",
       "CoQR-SYN               84.1  17.2       83.1  24.0\n",
       "\\singleConcatRel       82.8   4.4       82.7  20.2\n",
       "\\singleSYN             84.8  26.9       82.2  30.8\n",
       "\\singleSYN (1x)        85.0  24.0       81.7  28.4\n",
       "\\singleSYN (4x)        83.8  26.5       81.2  29.8\n",
       "\\singleSYNN            85.5  27.4       82.0  30.1\n",
       "Real                   86.7  39.6       83.4  31.4"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "coqr_test_table # 0620 ori cdta"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 165,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"9\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"7\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">CDTA</th>\n",
       "      <th colspan=\"4\" halign=\"left\">RSA</th>\n",
       "      <th colspan=\"3\" halign=\"left\">CDTA</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>all</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>all</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>domain_4</th>\n",
       "      <th>all</th>\n",
       "      <th>domain_1</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "      <th>all</th>\n",
       "      <th>domain_2</th>\n",
       "      <th>domain_3</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>82.5</td>\n",
       "      <td>93.9</td>\n",
       "      <td>76.9</td>\n",
       "      <td>74.7</td>\n",
       "      <td>50.9</td>\n",
       "      <td>8.8</td>\n",
       "      <td>7.8</td>\n",
       "      <td>16.3</td>\n",
       "      <td>1.5</td>\n",
       "      <td>83.2</td>\n",
       "      <td>85.3</td>\n",
       "      <td>83.6</td>\n",
       "      <td>68.4</td>\n",
       "      <td>37.3</td>\n",
       "      <td>49.9</td>\n",
       "      <td>10.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-Zero</th>\n",
       "      <td>75.8</td>\n",
       "      <td>84.3</td>\n",
       "      <td>71.5</td>\n",
       "      <td>70.7</td>\n",
       "      <td>47.3</td>\n",
       "      <td>20.0</td>\n",
       "      <td>19.2</td>\n",
       "      <td>23.5</td>\n",
       "      <td>23.1</td>\n",
       "      <td>78.9</td>\n",
       "      <td>81.9</td>\n",
       "      <td>78.4</td>\n",
       "      <td>64.9</td>\n",
       "      <td>33.3</td>\n",
       "      <td>43.0</td>\n",
       "      <td>12.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-SYN</th>\n",
       "      <td>84.1</td>\n",
       "      <td>93.6</td>\n",
       "      <td>79.6</td>\n",
       "      <td>76.5</td>\n",
       "      <td>58.0</td>\n",
       "      <td>22.9</td>\n",
       "      <td>23.5</td>\n",
       "      <td>17.0</td>\n",
       "      <td>33.8</td>\n",
       "      <td>83.1</td>\n",
       "      <td>85.4</td>\n",
       "      <td>82.5</td>\n",
       "      <td>73.2</td>\n",
       "      <td>44.0</td>\n",
       "      <td>51.2</td>\n",
       "      <td>28.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>84.8</td>\n",
       "      <td>92.9</td>\n",
       "      <td>81.3</td>\n",
       "      <td>77.0</td>\n",
       "      <td>66.7</td>\n",
       "      <td>31.0</td>\n",
       "      <td>32.5</td>\n",
       "      <td>20.8</td>\n",
       "      <td>36.9</td>\n",
       "      <td>82.2</td>\n",
       "      <td>84.8</td>\n",
       "      <td>81.8</td>\n",
       "      <td>70.4</td>\n",
       "      <td>45.5</td>\n",
       "      <td>56.8</td>\n",
       "      <td>21.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0                                            \\\n",
       "                        RSA                                      CDTA   \n",
       "                        all domain_1 domain_2 domain_3 domain_4   all   \n",
       "\\singleConcat          82.5     93.9     76.9     74.7     50.9   8.8   \n",
       "CoQR-Zero              75.8     84.3     71.5     70.7     47.3  20.0   \n",
       "CoQR-SYN               84.1     93.6     79.6     76.5     58.0  22.9   \n",
       "\\singleSYN             84.8     92.9     81.3     77.0     66.7  31.0   \n",
       "\\singleConcatRel        NaN      NaN      NaN      NaN      NaN   NaN   \n",
       "\n",
       "                                            multiwoz21                    \\\n",
       "                                                   RSA                     \n",
       "                 domain_2 domain_3 domain_4        all domain_1 domain_2   \n",
       "\\singleConcat         7.8     16.3      1.5       83.2     85.3     83.6   \n",
       "CoQR-Zero            19.2     23.5     23.1       78.9     81.9     78.4   \n",
       "CoQR-SYN             23.5     17.0     33.8       83.1     85.4     82.5   \n",
       "\\singleSYN           32.5     20.8     36.9       82.2     84.8     81.8   \n",
       "\\singleConcatRel      NaN      NaN      NaN        NaN      NaN      NaN   \n",
       "\n",
       "                                                   \n",
       "                           CDTA                    \n",
       "                 domain_3   all domain_2 domain_3  \n",
       "\\singleConcat        68.4  37.3     49.9     10.1  \n",
       "CoQR-Zero            64.9  33.3     43.0     12.5  \n",
       "CoQR-SYN             73.2  44.0     51.2     28.5  \n",
       "\\singleSYN           70.4  45.5     56.8     21.2  \n",
       "\\singleConcatRel      NaN   NaN      NaN      NaN  "
      ]
     },
     "execution_count": 165,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Remove selected per-domain sub-columns, addressed as (dataset, metric, domain) tuples.\n",
    "# The result is assigned back to the same name, so errors='ignore' keeps the cell\n",
    "# re-runnable: on a second run the columns are already gone and the default\n",
    "# errors='raise' would fail with a KeyError.\n",
    "coqr_test_table = coqr_test_table.drop(\n",
    "    columns=[\n",
    "        ('multiwoz21', 'RSA', 'domain_4'),\n",
    "        ('multiwoz21', 'CDTA', 'domain_4'),\n",
    "        ('multiwoz21', 'CDTA', 'domain_1'),\n",
    "        ('sgd/group0', 'CDTA', 'domain_1'),\n",
    "    ],\n",
    "    errors='ignore',\n",
    ")\n",
    "coqr_test_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 135,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"2\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>\\singleConcat</th>\n",
       "      <td>82.5</td>\n",
       "      <td>8.8</td>\n",
       "      <td>83.2</td>\n",
       "      <td>37.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleConcatRel</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN</th>\n",
       "      <td>84.8</td>\n",
       "      <td>31.0</td>\n",
       "      <td>82.2</td>\n",
       "      <td>45.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYNN</th>\n",
       "      <td>85.5</td>\n",
       "      <td>31.9</td>\n",
       "      <td>82.0</td>\n",
       "      <td>46.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Real</th>\n",
       "      <td>86.7</td>\n",
       "      <td>42.9</td>\n",
       "      <td>83.4</td>\n",
       "      <td>48.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-C</th>\n",
       "      <td>75.8</td>\n",
       "      <td>20.0</td>\n",
       "      <td>78.9</td>\n",
       "      <td>33.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>CoQR-S</th>\n",
       "      <td>84.1</td>\n",
       "      <td>22.9</td>\n",
       "      <td>83.1</td>\n",
       "      <td>44.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (1x)</th>\n",
       "      <td>85.0</td>\n",
       "      <td>27.9</td>\n",
       "      <td>81.7</td>\n",
       "      <td>43.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>\\singleSYN (4x)</th>\n",
       "      <td>83.8</td>\n",
       "      <td>30.7</td>\n",
       "      <td>81.2</td>\n",
       "      <td>43.9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 sgd/group0       multiwoz21      \n",
       "                        RSA  CDTA        RSA  CDTA\n",
       "\\singleConcat          82.5   8.8       83.2  37.3\n",
       "\\singleConcatRel        NaN   NaN        NaN   NaN\n",
       "\\singleSYN             84.8  31.0       82.2  45.5\n",
       "\\singleSYNN            85.5  31.9       82.0  46.1\n",
       "Real                   86.7  42.9       83.4  48.0\n",
       "CoQR-C                 75.8  20.0       78.9  33.3\n",
       "CoQR-S                 84.1  22.9       83.1  44.0\n",
       "\\singleSYN (1x)        85.0  27.9       81.7  43.5\n",
       "\\singleSYN (4x)        83.8  30.7       81.2  43.9"
      ]
     },
     "execution_count": 135,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "coqr_test_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrr}\n",
      "\\toprule\n",
      "{} & \\multicolumn{2}{l}{sgd/group0} & \\multicolumn{2}{l}{multiwoz21} \\\\\n",
      "{} &        RSA &  CDTA &        RSA &  CDTA \\\\\n",
      "\\midrule\n",
      "\\textbackslash singleConcat    &       80.9 &   0.5 &       81.8 &   7.3 \\\\\n",
      "CoQR-Zero        &       73.3 &  16.0 &       77.5 &   8.1 \\\\\n",
      "CoQR-ChatGPT     &       78.4 &  25.7 &       80.0 &  23.0 \\\\\n",
      "CoQR-SYN         &       82.7 &  16.9 &       81.5 &  21.6 \\\\\n",
      "\\textbackslash singleConcatRel &        NaN &   NaN &        NaN &   NaN \\\\\n",
      "\\textbackslash singleSYN       &       82.7 &  21.8 &       80.7 &  29.1 \\\\\n",
      "\\textbackslash singleSYN (1x)  &        NaN &   NaN &        NaN &   NaN \\\\\n",
      "\\textbackslash singleSYN (4x)  &        NaN &   NaN &        NaN &   NaN \\\\\n",
      "\\textbackslash singleSYNN      &        NaN &   NaN &        NaN &   NaN \\\\\n",
      "Real             &        NaN &   NaN &        NaN &   NaN \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_33250/3055608670.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(coqr_test_table.to_latex())\n"
     ]
    }
   ],
   "source": [
    "print(coqr_test_table.to_latex())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 113,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrrrrrrrr}\n",
      "\\toprule\n",
      "{} & \\multicolumn{5}{l}{multiwoz21} & \\multicolumn{5}{l}{sgd/group0} \\\\\n",
      "{} &  Multi JGA & Multi TA & Multi CDTA & Cross JGA & Single JGA &  Multi JGA & Multi TA & Multi CDTA & Cross JGA & Single JGA \\\\\n",
      "\\midrule\n",
      "Single+Concat (2x) &       39.5 &     74.1 &        5.6 &      28.9 &       63.6 &       36.3 &     78.3 &        1.3 &      35.2 &       83.3 \\\\\n",
      "w/ CANARD          &       34.5 &     70.3 &        6.2 &      26.6 &       59.2 &       30.0 &     71.0 &       13.7 &      30.4 &       64.6 \\\\\n",
      "w/ CANARD+MIX      &       39.4 &     73.7 &       16.6 &      30.0 &       63.4 &       39.5 &     78.7 &       18.1 &      39.5 &       82.2 \\\\\n",
      "w/ ChatGPT         &       36.3 &     70.6 &       17.0 &      27.4 &       61.1 &       32.3 &     72.7 &       22.7 &      32.1 &       66.2 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_88698/2481759033.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(coqr_test_table.loc['turn'].to_latex())\n"
     ]
    }
   ],
   "source": [
    "print(coqr_test_table.loc['turn'].to_latex())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Ablation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"5\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>F1&gt;0</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.01</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.3</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.5</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.8</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1&amp;TRUE_DOM</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>TRUE_SLOT</th>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                sgd/group0                             multiwoz21             \\\n",
       "                       RSA CDTA Ratio Precision Recall        RSA CDTA Ratio   \n",
       "F1>0                   NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "F1>0.01                NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "F1>0.1                 NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "F1>0.3                 NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "F1>0.5                 NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "F1>0.8                 NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "F1>0.1&TRUE_DOM        NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "TRUE_SLOT              NaN  NaN   NaN       NaN    NaN        NaN  NaN   NaN   \n",
       "\n",
       "                                  \n",
       "                Precision Recall  \n",
       "F1>0                  NaN    NaN  \n",
       "F1>0.01               NaN    NaN  \n",
       "F1>0.1                NaN    NaN  \n",
       "F1>0.3                NaN    NaN  \n",
       "F1>0.5                NaN    NaN  \n",
       "F1>0.8                NaN    NaN  \n",
       "F1>0.1&TRUE_DOM       NaN    NaN  \n",
       "TRUE_SLOT             NaN    NaN  "
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Row labels of the ablation table, each paired with the QADST directory of that variant.\n",
    "# Keeping label and directory side by side stops the two derived lists drifting apart.\n",
    "# NOTE: this cell rebinds aug_types / index_names / datasets from earlier cells.\n",
    "ablation_variants = [\n",
    "    ('F1>0', 'qadst_f1_th>0'),\n",
    "    ('F1>0.01', 'qadst_f1_th>0.01'),\n",
    "    ('F1>0.1', 'qadst_f1_th>0.1'),\n",
    "    ('F1>0.3', 'qadst_f1_th>0.3'),\n",
    "    ('F1>0.5', 'qadst_f1_th>0.5'),\n",
    "    ('F1>0.8', 'qadst_f1_th>0.8'),\n",
    "    ('F1>0.1&TRUE_DOM', 'qadst_f1_th>0.1_true_domain_comb'),\n",
    "    ('TRUE_SLOT', 'qadst_true_slot_pairs'),\n",
    "]\n",
    "index_names = [label for label, _ in ablation_variants]\n",
    "qadst_dirs = [directory for _, directory in ablation_variants]\n",
    "# Every variant is evaluated with the same (aug_type, aug_times) setting.\n",
    "aug_types = [(5, 2.0) for _ in qadst_dirs]\n",
    "datasets = ['sgd/group0', 'multiwoz21']\n",
    "metric_names = ['RSA', 'CDTA', 'Ratio', 'Precision', 'Recall']\n",
    "# Empty (all-NaN) frame: one row per variant, one (dataset, metric) column per pair.\n",
    "ablation_table = pd.DataFrame(\n",
    "    index=index_names,\n",
    "    columns=pd.MultiIndex.from_product([datasets, metric_names]),\n",
    ")\n",
    "ablation_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Fill the RSA / CDTA columns of the ablation table from each variant's result file.\n",
    "table = ablation_table\n",
    "for (aug_type, aug_times), qadst_dir, index_name in zip(aug_types, qadst_dirs, index_names):\n",
    "    for dataset in datasets:\n",
    "        res_dir = f'output0615/{dataset}/{qadst_dir}/t5-large_aug{aug_type}_x{aug_times}_model4_context100'\n",
    "        res_file = f'{res_dir}/test_multi_domain_result_ori_cdta.md'\n",
    "        if not os.path.exists(res_file):\n",
    "            # The cells stay NaN, but report the gap instead of skipping silently.\n",
    "            print(f'[skip] missing result file: {res_file}')\n",
    "            continue\n",
    "        # The result is a '|'-delimited table: column 1 becomes the row label, all-empty\n",
    "        # columns are dropped, and the first parsed row is skipped (presumably the\n",
    "        # markdown '---' separator row -- confirm against a result file).\n",
    "        df = pd.read_table(res_file, sep='|', index_col=1).dropna(axis=1, how='all').iloc[1:]\n",
    "        # Strip the padding around cell values, column names and row labels.\n",
    "        df = df.apply(lambda col: col.str.strip())\n",
    "        df = df.rename(columns=str.strip).rename(index=str.strip)\n",
    "        # Values are stored as the stripped strings read from the file.\n",
    "        for metric in ('RSA', 'CDTA'):\n",
    "            table.loc[index_name, (dataset, metric)] = df.loc['all', metric]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"5\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>F1&gt;0</th>\n",
       "      <td>0.8455318300347572</td>\n",
       "      <td>0.26227738801942796</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.8189786188385456</td>\n",
       "      <td>0.29117876658860264</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.01</th>\n",
       "      <td>0.8430816095835237</td>\n",
       "      <td>0.24662709120345386</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.8250100191216666</td>\n",
       "      <td>0.3091334894613583</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1</th>\n",
       "      <td>0.8483298514948231</td>\n",
       "      <td>0.26875337290879653</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.822339879389787</td>\n",
       "      <td>0.3075722092115535</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.3</th>\n",
       "      <td>0.8515074526539687</td>\n",
       "      <td>0.23961144090663788</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.818364395259508</td>\n",
       "      <td>0.30601092896174864</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.5</th>\n",
       "      <td>0.8508244686320376</td>\n",
       "      <td>0.26227738801942796</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.8147157497006207</td>\n",
       "      <td>0.2693208430913349</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.8</th>\n",
       "      <td>0.8392410054259714</td>\n",
       "      <td>0.18078791149487317</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.8165034655316281</td>\n",
       "      <td>0.2154566744730679</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1&amp;TRUE_DOM</th>\n",
       "      <td>0.8449357245312612</td>\n",
       "      <td>0.24986508364813814</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.8185428005688219</td>\n",
       "      <td>0.29430132708821233</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>TRUE_SLOT</th>\n",
       "      <td>0.8642971086118983</td>\n",
       "      <td>0.3059902860226659</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>0.8268752468589738</td>\n",
       "      <td>0.3473848555815769</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                         sgd/group0                                       \\\n",
       "                                RSA                 CDTA Ratio Precision   \n",
       "F1>0             0.8455318300347572  0.26227738801942796   NaN       NaN   \n",
       "F1>0.01          0.8430816095835237  0.24662709120345386   NaN       NaN   \n",
       "F1>0.1           0.8483298514948231  0.26875337290879653   NaN       NaN   \n",
       "F1>0.3           0.8515074526539687  0.23961144090663788   NaN       NaN   \n",
       "F1>0.5           0.8508244686320376  0.26227738801942796   NaN       NaN   \n",
       "F1>0.8           0.8392410054259714  0.18078791149487317   NaN       NaN   \n",
       "F1>0.1&TRUE_DOM  0.8449357245312612  0.24986508364813814   NaN       NaN   \n",
       "TRUE_SLOT        0.8642971086118983   0.3059902860226659   NaN       NaN   \n",
       "\n",
       "                                multiwoz21                             \\\n",
       "                Recall                 RSA                 CDTA Ratio   \n",
       "F1>0               NaN  0.8189786188385456  0.29117876658860264   NaN   \n",
       "F1>0.01            NaN  0.8250100191216666   0.3091334894613583   NaN   \n",
       "F1>0.1             NaN   0.822339879389787   0.3075722092115535   NaN   \n",
       "F1>0.3             NaN   0.818364395259508  0.30601092896174864   NaN   \n",
       "F1>0.5             NaN  0.8147157497006207   0.2693208430913349   NaN   \n",
       "F1>0.8             NaN  0.8165034655316281   0.2154566744730679   NaN   \n",
       "F1>0.1&TRUE_DOM    NaN  0.8185428005688219  0.29430132708821233   NaN   \n",
       "TRUE_SLOT          NaN  0.8268752468589738   0.3473848555815769   NaN   \n",
       "\n",
       "                                  \n",
       "                Precision Recall  \n",
       "F1>0                  NaN    NaN  \n",
       "F1>0.01               NaN    NaN  \n",
       "F1>0.1                NaN    NaN  \n",
       "F1>0.3                NaN    NaN  \n",
       "F1>0.5                NaN    NaN  \n",
       "F1>0.8                NaN    NaN  \n",
       "F1>0.1&TRUE_DOM       NaN    NaN  \n",
       "TRUE_SLOT             NaN    NaN  "
      ]
     },
     "execution_count": 82,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ablation_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "sgd/group0\n",
      "87\n",
      "multiwoz21\n",
      "34\n"
     ]
    }
   ],
   "source": [
    "# Fill the Ratio / Precision / Recall columns, then convert the whole table to percentages.\n",
    "table = ablation_table\n",
    "for dataset in datasets:\n",
    "    print(dataset)\n",
    "    # Context managers close the JSON files instead of leaking the open handles.\n",
    "    with open(f'data/{dataset}/multi_domain_slot_pairs.json') as golden_file:\n",
    "        golden_slot_pairs = json.load(golden_file)\n",
    "    print(len(golden_slot_pairs))\n",
    "    # Denominator of the Ratio column, hard-coded per dataset\n",
    "    # (an earlier revision of this cell used 143 / 889 instead).\n",
    "    total_slot_pairs = 690 if dataset == 'multiwoz21' else 9972\n",
    "    for index_name, qadst_dir in zip(index_names, qadst_dirs):\n",
    "        with open(f'data/{dataset}/{qadst_dir}/aug5_x2.0/coqr_slot_pairs.json') as pred_file:\n",
    "            pred_slot_pairs = json.load(pred_file)\n",
    "        # Only the keys of both mappings are compared; the returned F1 is not reported.\n",
    "        precision, recall, _f1 = eval_slot_pairs_prediction(set(golden_slot_pairs.keys()), set(pred_slot_pairs.keys()))\n",
    "        table.loc[index_name, (dataset, 'Ratio')] = len(pred_slot_pairs)/total_slot_pairs\n",
    "        table.loc[index_name, (dataset, 'Precision')] = precision\n",
    "        table.loc[index_name, (dataset, 'Recall')] = recall\n",
    "\n",
    "# Coerce every cell to a number and express it as a percentage with one decimal.\n",
    "# NOTE: this rebinds ablation_table to the scaled frame, so re-running this cell without\n",
    "# rebuilding the table first multiplies the RSA / CDTA values by 100 a second time.\n",
    "ablation_table = ablation_table.applymap(lambda x: round(pd.to_numeric(x, errors='coerce') * 100, 1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"5\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>F1&gt;0</th>\n",
       "      <td>84.6</td>\n",
       "      <td>26.2</td>\n",
       "      <td>4.7</td>\n",
       "      <td>10.9</td>\n",
       "      <td>58.6</td>\n",
       "      <td>81.9</td>\n",
       "      <td>29.1</td>\n",
       "      <td>14.9</td>\n",
       "      <td>29.1</td>\n",
       "      <td>88.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.01</th>\n",
       "      <td>84.3</td>\n",
       "      <td>24.7</td>\n",
       "      <td>4.7</td>\n",
       "      <td>10.9</td>\n",
       "      <td>58.6</td>\n",
       "      <td>82.5</td>\n",
       "      <td>30.9</td>\n",
       "      <td>14.1</td>\n",
       "      <td>33.0</td>\n",
       "      <td>94.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1</th>\n",
       "      <td>84.8</td>\n",
       "      <td>26.9</td>\n",
       "      <td>4.5</td>\n",
       "      <td>10.8</td>\n",
       "      <td>55.2</td>\n",
       "      <td>82.2</td>\n",
       "      <td>30.8</td>\n",
       "      <td>11.2</td>\n",
       "      <td>35.1</td>\n",
       "      <td>79.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.3</th>\n",
       "      <td>85.2</td>\n",
       "      <td>24.0</td>\n",
       "      <td>4.1</td>\n",
       "      <td>12.0</td>\n",
       "      <td>56.3</td>\n",
       "      <td>81.8</td>\n",
       "      <td>30.6</td>\n",
       "      <td>8.7</td>\n",
       "      <td>41.7</td>\n",
       "      <td>73.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.5</th>\n",
       "      <td>85.1</td>\n",
       "      <td>26.2</td>\n",
       "      <td>3.8</td>\n",
       "      <td>11.4</td>\n",
       "      <td>49.4</td>\n",
       "      <td>81.5</td>\n",
       "      <td>26.9</td>\n",
       "      <td>7.1</td>\n",
       "      <td>46.9</td>\n",
       "      <td>67.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.8</th>\n",
       "      <td>83.9</td>\n",
       "      <td>18.1</td>\n",
       "      <td>2.8</td>\n",
       "      <td>14.9</td>\n",
       "      <td>47.1</td>\n",
       "      <td>81.7</td>\n",
       "      <td>21.5</td>\n",
       "      <td>2.5</td>\n",
       "      <td>64.7</td>\n",
       "      <td>32.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1&amp;TRUE_DOM</th>\n",
       "      <td>84.5</td>\n",
       "      <td>25.0</td>\n",
       "      <td>1.3</td>\n",
       "      <td>48.1</td>\n",
       "      <td>73.6</td>\n",
       "      <td>81.9</td>\n",
       "      <td>29.4</td>\n",
       "      <td>9.1</td>\n",
       "      <td>41.3</td>\n",
       "      <td>76.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>TRUE_SLOT</th>\n",
       "      <td>86.4</td>\n",
       "      <td>30.6</td>\n",
       "      <td>0.7</td>\n",
       "      <td>100.0</td>\n",
       "      <td>75.9</td>\n",
       "      <td>82.7</td>\n",
       "      <td>34.7</td>\n",
       "      <td>4.8</td>\n",
       "      <td>100.0</td>\n",
       "      <td>97.1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                sgd/group0                              multiwoz21        \\\n",
       "                       RSA  CDTA Ratio Precision Recall        RSA  CDTA   \n",
       "F1>0                  84.6  26.2   4.7      10.9   58.6       81.9  29.1   \n",
       "F1>0.01               84.3  24.7   4.7      10.9   58.6       82.5  30.9   \n",
       "F1>0.1                84.8  26.9   4.5      10.8   55.2       82.2  30.8   \n",
       "F1>0.3                85.2  24.0   4.1      12.0   56.3       81.8  30.6   \n",
       "F1>0.5                85.1  26.2   3.8      11.4   49.4       81.5  26.9   \n",
       "F1>0.8                83.9  18.1   2.8      14.9   47.1       81.7  21.5   \n",
       "F1>0.1&TRUE_DOM       84.5  25.0   1.3      48.1   73.6       81.9  29.4   \n",
       "TRUE_SLOT             86.4  30.6   0.7     100.0   75.9       82.7  34.7   \n",
       "\n",
       "                                        \n",
       "                Ratio Precision Recall  \n",
       "F1>0             14.9      29.1   88.2  \n",
       "F1>0.01          14.1      33.0   94.1  \n",
       "F1>0.1           11.2      35.1   79.4  \n",
       "F1>0.3            8.7      41.7   73.5  \n",
       "F1>0.5            7.1      46.9   67.6  \n",
       "F1>0.8            2.5      64.7   32.4  \n",
       "F1>0.1&TRUE_DOM   9.1      41.3   76.5  \n",
       "TRUE_SLOT         4.8     100.0   97.1  "
      ]
     },
     "execution_count": 84,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ablation_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"5\" halign=\"left\">sgd/group0</th>\n",
       "      <th colspan=\"5\" halign=\"left\">multiwoz21</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "      <th>RSA</th>\n",
       "      <th>CDTA</th>\n",
       "      <th>Ratio</th>\n",
       "      <th>Precision</th>\n",
       "      <th>Recall</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>F1&gt;0</th>\n",
       "      <td>84.6</td>\n",
       "      <td>26.2</td>\n",
       "      <td>4.7</td>\n",
       "      <td>10.9</td>\n",
       "      <td>58.6</td>\n",
       "      <td>81.9</td>\n",
       "      <td>29.1</td>\n",
       "      <td>14.9</td>\n",
       "      <td>29.1</td>\n",
       "      <td>88.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.1</th>\n",
       "      <td>84.8</td>\n",
       "      <td>26.9</td>\n",
       "      <td>4.5</td>\n",
       "      <td>10.8</td>\n",
       "      <td>55.2</td>\n",
       "      <td>82.2</td>\n",
       "      <td>30.8</td>\n",
       "      <td>11.2</td>\n",
       "      <td>35.1</td>\n",
       "      <td>79.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.3</th>\n",
       "      <td>85.2</td>\n",
       "      <td>24.0</td>\n",
       "      <td>4.1</td>\n",
       "      <td>12.0</td>\n",
       "      <td>56.3</td>\n",
       "      <td>81.8</td>\n",
       "      <td>30.6</td>\n",
       "      <td>8.7</td>\n",
       "      <td>41.7</td>\n",
       "      <td>73.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.5</th>\n",
       "      <td>85.1</td>\n",
       "      <td>26.2</td>\n",
       "      <td>3.8</td>\n",
       "      <td>11.4</td>\n",
       "      <td>49.4</td>\n",
       "      <td>81.5</td>\n",
       "      <td>26.9</td>\n",
       "      <td>7.1</td>\n",
       "      <td>46.9</td>\n",
       "      <td>67.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>F1&gt;0.8</th>\n",
       "      <td>83.9</td>\n",
       "      <td>18.1</td>\n",
       "      <td>2.8</td>\n",
       "      <td>14.9</td>\n",
       "      <td>47.1</td>\n",
       "      <td>81.7</td>\n",
       "      <td>21.5</td>\n",
       "      <td>2.5</td>\n",
       "      <td>64.7</td>\n",
       "      <td>32.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>TRUE_SLOT</th>\n",
       "      <td>86.4</td>\n",
       "      <td>30.6</td>\n",
       "      <td>0.7</td>\n",
       "      <td>100.0</td>\n",
       "      <td>75.9</td>\n",
       "      <td>82.7</td>\n",
       "      <td>34.7</td>\n",
       "      <td>4.8</td>\n",
       "      <td>100.0</td>\n",
       "      <td>97.1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          sgd/group0                              multiwoz21              \\\n",
       "                 RSA  CDTA Ratio Precision Recall        RSA  CDTA Ratio   \n",
       "F1>0            84.6  26.2   4.7      10.9   58.6       81.9  29.1  14.9   \n",
       "F1>0.1          84.8  26.9   4.5      10.8   55.2       82.2  30.8  11.2   \n",
       "F1>0.3          85.2  24.0   4.1      12.0   56.3       81.8  30.6   8.7   \n",
       "F1>0.5          85.1  26.2   3.8      11.4   49.4       81.5  26.9   7.1   \n",
       "F1>0.8          83.9  18.1   2.8      14.9   47.1       81.7  21.5   2.5   \n",
       "TRUE_SLOT       86.4  30.6   0.7     100.0   75.9       82.7  34.7   4.8   \n",
       "\n",
       "                            \n",
       "          Precision Recall  \n",
       "F1>0           29.1   88.2  \n",
       "F1>0.1         35.1   79.4  \n",
       "F1>0.3         41.7   73.5  \n",
       "F1>0.5         46.9   67.6  \n",
       "F1>0.8         64.7   32.4  \n",
       "TRUE_SLOT     100.0   97.1  "
      ]
     },
     "execution_count": 78,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the table without the 'F1>0.1&TRUE_DOM' and 'F1>0.01' rows.\n",
    "ablation_table.drop(index=['F1>0.1&TRUE_DOM', 'F1>0.01'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrrrrrrrr}\n",
      "\\toprule\n",
      "{} & \\multicolumn{5}{l}{sgd/group0} & \\multicolumn{5}{l}{multiwoz21} \\\\\n",
      "{} &        RSA &  CDTA & Ratio & Precision & Recall &        RSA &  CDTA & Ratio & Precision & Recall \\\\\n",
      "\\midrule\n",
      "F1>0      &       84.6 &  26.2 &   4.7 &      10.9 &   58.6 &       81.9 &  29.1 &  14.9 &      29.1 &   88.2 \\\\\n",
      "F1>0.1    &       84.8 &  26.9 &   4.5 &      10.8 &   55.2 &       82.2 &  30.8 &  11.2 &      35.1 &   79.4 \\\\\n",
      "F1>0.3    &       85.2 &  24.0 &   4.1 &      12.0 &   56.3 &       81.8 &  30.6 &   8.7 &      41.7 &   73.5 \\\\\n",
      "F1>0.5    &       85.1 &  26.2 &   3.8 &      11.4 &   49.4 &       81.5 &  26.9 &   7.1 &      46.9 &   67.6 \\\\\n",
      "F1>0.8    &       83.9 &  18.1 &   2.8 &      14.9 &   47.1 &       81.7 &  21.5 &   2.5 &      64.7 &   32.4 \\\\\n",
      "TRUE\\_SLOT &       86.4 &  30.6 &   0.7 &     100.0 &   75.9 &       82.7 &  34.7 &   4.8 &     100.0 &   97.1 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_103566/327982617.py:1: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.\n",
      "  print(ablation_table.drop(index='F1>0.1&TRUE_DOM').drop(index='F1>0.01').to_latex())\n"
     ]
    }
   ],
   "source": [
    "# LaTeX export of the table without the 'F1>0.1&TRUE_DOM' and 'F1>0.01' rows.\n",
    "print(ablation_table.drop(index=['F1>0.1&TRUE_DOM', 'F1>0.01']).to_latex())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.13"
  },
  "vscode": {
   "interpreter": {
    "hash": "0d7e61334dfc0ef49fed574cd0889517bf66c7c88797d6df65d4f14c89b6fa83"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
