{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "93c6c8b1",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{table*}[ht]\n",
      "    \\centering\n",
      "    \\caption{Comparison of performance metrics across penalty configurations.}\n",
      "    \\label{tab:performance_summary}\n",
      "    \\providecommand{\\res}[2]{\\begin{tabular}{@{}c@{}}#1\\\\[-3pt]{\\scriptsize (#2)}\\end{tabular}}\n",
      "    \\resizebox{0.9\\textwidth}{!}{%\n",
      "    \\begin{tabular}{@{} l ccccc | ccccc @{}}\n",
      "        \\toprule\n",
      "        \\multirow{2}{*}{Model} & \\multicolumn{5}{c}{AUROC} & \\multicolumn{5}{c}{AUPRC} \\\\\n",
      "        \\cmidrule(lr){2-6} \\cmidrule(lr){7-11}\n",
      "         & Weight & Jacob-L1 & Jacob-F & Shap & F-Shap & Weight & Jacob-L1 & Jacob-F & Shap & F-Shap \\\\\n",
      "        \\midrule\n",
      "        MLP & -- & \\res{0.859}{0.026} & \\res{0.844}{0.030} & \\res{0.874}{0.015} & \\res{0.855}{0.025} & -- & \\res{0.645}{0.038} & \\res{0.640}{0.036} & \\res{0.673}{0.021} & \\res{0.659}{0.029} \\\\\n",
      "        cMLP & -- & \\res{0.827}{0.023} & \\res{0.831}{0.018} & \\res{0.854}{0.012} & \\res{0.844}{0.018} & -- & \\res{0.630}{0.020} & \\res{0.633}{0.015} & \\res{0.660}{0.014} & \\res{0.639}{0.021} \\\\\n",
      "        LSTM & -- & \\res{0.836}{0.013} & \\res{0.737}{0.049} & \\res{0.847}{0.003} & \\res{0.713}{0.051} & -- & \\res{0.590}{0.039} & \\res{0.408}{0.071} & \\res{0.672}{0.030} & \\res{0.370}{0.076} \\\\\n",
      "        cLSTM & -- & \\res{0.754}{0.051} & \\res{0.705}{0.043} & \\res{0.797}{0.049} & \\res{0.681}{0.057} & -- & \\res{0.491}{0.061} & \\res{0.388}{0.032} & \\res{0.567}{0.059} & \\res{0.343}{0.065} \\\\\n",
      "        \\bottomrule\n",
      "    \\end{tabular}%\n",
      "    }\n",
      "\\end{table*}\n",
      "Success: Processed 90 records.\n",
      "Outputs: ablation_summary.csv, table_results.tex\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import glob\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "\n",
    "# --- CONFIGURATION ---\n",
    "FOLDER_PATH = './sensitivity_model'\n",
    "\n",
    "# Using a single dictionary for specific output paths\n",
    "OUTPUT_FILE = {\n",
    "    'csv': 'ablation_summary.csv',\n",
    "    'tex': 'table_results.tex'\n",
    "}\n",
    "\n",
    "PENALTY_MAPPING = {\n",
    "    'Weight': 'Weight', 'L2': 'Weight',\n",
    "    'Jacob_L1': 'Jacob-L1',\n",
    "    'Jacob_F': 'Jacob-F',\n",
    "    'Shapley': 'Shap',\n",
    "    'Fast_Shap': 'F-Shap', 'F-Shap': 'F-Shap'\n",
    "}\n",
    "\n",
    "COLUMN_ORDER = ['Weight', 'Jacob-L1', 'Jacob-F', 'Shap', 'F-Shap']\n",
    "MODEL_ORDER = ['MLP', 'cMLP', 'LSTM', 'cLSTM']\n",
    "\n",
    "def escape_tex(text):\n",
    "    \"\"\"Escapes underscores for LaTeX compatibility.\"\"\"\n",
    "    return str(text).replace('_', r'\\_')\n",
    "\n",
    "def parse_filename(filename):\n",
    "    \"\"\"Extracts metadata from filename strings.\"\"\"\n",
    "    base = os.path.basename(filename)\n",
    "    name_no_ext = os.path.splitext(base)[0]\n",
    "    parts = name_no_ext.split('_')\n",
    "    \n",
    "    if len(parts) < 6: \n",
    "        return None\n",
    "\n",
    "    raw_penalty = \"_\".join(parts[5:])\n",
    "    return {\n",
    "        'model': parts[4],\n",
    "        'penalty': PENALTY_MAPPING.get(raw_penalty, raw_penalty)\n",
    "    }\n",
    "\n",
    "def process_files(folder_path):\n",
    "    \"\"\"Aggregates and processes result files.\"\"\"\n",
    "    results_list = []\n",
    "    files = glob.glob(os.path.join(folder_path, '*'))\n",
    "    \n",
    "    for f in files:\n",
    "        if os.path.isdir(f) or not (f.endswith('.csv') or f.endswith('.txt')):\n",
    "            continue\n",
    "            \n",
    "        meta = parse_filename(f)\n",
    "        if not meta: continue\n",
    "        \n",
    "        try:\n",
    "            # Rigorous column selection\n",
    "            df = pd.read_csv(f, usecols=['AUROC', 'AUPRC'])\n",
    "            \n",
    "            entry = meta.copy()\n",
    "            entry.update({\n",
    "                'AUROC': df['AUROC'].max(), \n",
    "                'AUPRC': df['AUPRC'].max()\n",
    "            })\n",
    "            results_list.append(entry)\n",
    "        except Exception as e:\n",
    "            print(f\"File Error: Skipping {f} - {e}\")\n",
    "\n",
    "    return pd.DataFrame(results_list)\n",
    "\n",
    "def generate_comparative_latex(df, caption, label):\n",
    "    \"\"\"Generates a professionally formatted LaTeX table.\"\"\"\n",
    "    # Group and aggregate for statistical reporting\n",
    "    df_agg = df.groupby(['model', 'penalty'])[['AUROC', 'AUPRC']].agg(['mean', 'std'])\n",
    "    \n",
    "    latex = [\n",
    "        r\"\\begin{table*}[ht]\",\n",
    "        r\"    \\centering\",\n",
    "        f\"    \\\\caption{{{caption}}}\",\n",
    "        f\"    \\\\label{{{label}}}\",\n",
    "        r\"    \\providecommand{\\res}[2]{\\begin{tabular}{@{}c@{}}#1\\\\[-3pt]{\\scriptsize (#2)}\\end{tabular}}\",\n",
    "        r\"    \\resizebox{0.9\\textwidth}{!}{%\",\n",
    "        r\"    \\begin{tabular}{@{} l \" + \"c\" * len(COLUMN_ORDER) + \" | \" + \"c\" * len(COLUMN_ORDER) + \" @{}}\",\n",
    "        r\"        \\toprule\",\n",
    "        r\"        \\multirow{2}{*}{Model} & \\multicolumn{\" + str(len(COLUMN_ORDER)) + r\"}{c}{AUROC} & \\multicolumn{\" + str(len(COLUMN_ORDER)) + r\"}{c}{AUPRC} \\\\\",\n",
    "        r\"        \\cmidrule(lr){2-\" + str(len(COLUMN_ORDER)+1) + r\"} \\cmidrule(lr){\" + str(len(COLUMN_ORDER)+2) + r\"-\" + str(2*len(COLUMN_ORDER)+1) + r\"}\",\n",
    "        \"         & \" + \" & \".join(COLUMN_ORDER) + \" & \" + \" & \".join(COLUMN_ORDER) + r\" \\\\\",\n",
    "        r\"        \\midrule\"\n",
    "    ]\n",
    "\n",
    "    for model in MODEL_ORDER:\n",
    "        if model not in df_agg.index.get_level_values('model'):\n",
    "            continue\n",
    "        \n",
    "        row = [f\"        {escape_tex(model)}\"]\n",
    "        \n",
    "        for metric in ['AUROC', 'AUPRC']:\n",
    "            for pen in COLUMN_ORDER:\n",
    "                try:\n",
    "                    mean_val = df_agg.loc[(model, pen), (metric, 'mean')]\n",
    "                    std_val = df_agg.loc[(model, pen), (metric, 'std')]\n",
    "                    row.append(f\"\\\\res{{{mean_val:.3f}}}{{{std_val:.3f}}}\")\n",
    "                except KeyError:\n",
    "                    row.append(\"--\")\n",
    "        \n",
    "        latex.append(\" & \".join(row) + r\" \\\\\")\n",
    "\n",
    "    latex.extend([\n",
    "        r\"        \\bottomrule\",\n",
    "        r\"    \\end{tabular}%\",\n",
    "        r\"    }\",\n",
    "        r\"\\end{table*}\"\n",
    "    ])\n",
    "    \n",
    "    return \"\\n\".join(latex)\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    df_results = process_files(FOLDER_PATH)\n",
    "\n",
    "    if not df_results.empty:\n",
    "        # Save results to the specified CSV\n",
    "        # df_results.to_csv(OUTPUT_FILE['csv'], index=False)\n",
    "        \n",
    "        # Generate and save the TeX table\n",
    "        tex_output = generate_comparative_latex(\n",
    "            df_results, \n",
    "            caption=\"Comparison of performance metrics across penalty configurations.\",\n",
    "            label=\"tab:performance_summary\"\n",
    "        )\n",
    "        \n",
    "        # with open(OUTPUT_FILE['tex'], 'w') as f:\n",
    "        #     f.write(tex_output)\n",
    "        \n",
    "        print(tex_output)\n",
    "        print(f\"Success: Processed {len(df_results)} records.\")\n",
    "        print(f\"Outputs: {OUTPUT_FILE['csv']}, {OUTPUT_FILE['tex']}\")\n",
    "    else:\n",
    "        print(\"Error: No data found. Check your FOLDER_PATH and filename patterns.\")"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "MPS",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
