{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5d289e4e-8334-4cbd-9b3e-0eef2ab5fc9e",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "%reload_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7363774a-08a1-4536-bce0-19ffb9415952",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import json\n",
    "import logging\n",
    "import typing as ty\n",
    "from IPython.display import display, HTML, Markdown, display_html\n",
    "from pathlib import Path\n",
    "from typing import Dict, List, Optional\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "import networkx as nx\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import scipy.stats as stats\n",
    "\n",
    "import egr.pandas_helpers as ph\n",
    "import nb.reports.helpers as hlp\n",
    "import nb.reports.vis_helpers as vh\n",
    "from egr.util import load_graph\n",
    "from egr.log import init_logging\n",
    "\n",
    "LOG = logging.getLogger('report')\n",
    "\n",
    "init_logging(level_name='info')\n",
    "pd.set_option('display.precision', 2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4b850c0a-816e-4da8-b0ee-29927c246684",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# RUN_ID: str = '230718-02'\n",
    "# VARIANT: str = 'p008-02'\n",
    "NUM_FOLDS: int = 10\n",
    "SAMPLES = ['0002']\n",
    "\n",
    "all_samples = [f'{i:04d}' for i in range(1, 6)]\n",
    "# control_rounds = ['rL', 'rP4', 'rR']\n",
    "control_rounds = ['rR']\n",
    "eegl_rounds = [f'r{i}' for i in range(7)]\n",
    "all_rounds = control_rounds + eegl_rounds\n",
    "data_root: Path = Path(f'./.output')\n",
    "# exp_root: Path = data_root / RUN_ID\n",
    "# fsg_args = dict(run_id=RUN_ID, tags=eegl_rounds)\n",
    "num_features: int = 10\n",
    "ncols: int = num_features"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f77a992e-4965-4bf6-802b-0739a2e64785",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "from itertools import chain,cycle\n",
    "def display_side_by_side(*args,titles=cycle([''])):\n",
    "    html_str=''\n",
    "    for df,title in zip(args, chain(titles,cycle(['</br>'])) ):\n",
    "        html_str+='<th style=\"text-align:center\"><td style=\"vertical-align:top\">'\n",
    "        html_str+=f'<h2 style=\"text-align: center;\">{title}</h2>'\n",
    "        html_str+=df.to_html().replace('table','table style=\"display:inline\"')\n",
    "        html_str+='</td></th>'\n",
    "    display_html(html_str,raw=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "db138484-d6e9-41ae-9a5d-9517764f1fac",
   "metadata": {
    "jupyter": {
     "source_hidden": true
    },
    "tags": []
   },
   "outputs": [],
   "source": [
    "CSS = \"\"\"\n",
    ".output {\n",
    "    flex-direction: row;\n",
    "}\n",
    "\n",
    "h1 {\n",
    "    align-text: center;\n",
    "}\n",
    "\"\"\"\n",
    "\n",
    "HTML('<style>{}</style>'.format(CSS))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e723e641-4b20-4991-9e3e-618475c6b18f",
   "metadata": {
    "scrolled": true,
    "tags": []
   },
   "outputs": [],
   "source": [
    "def show(var: str, run_id: str, samples: ty.List[str], n_folds: int = 10):\n",
    "    exp_root = data_root / run_id\n",
    "    def mk_table(fold) -> pd.DataFrame:\n",
    "        return hlp.make_table(exp_root, samples, var, all_rounds, fold)\n",
    "\n",
    "    tables = [mk_table(fold + 1) for fold in range(n_folds)]\n",
    "    arrays = [df.to_numpy() for df in tables]\n",
    "\n",
    "    mean_df = ph.mean_df(tables)\n",
    "    sem = stats.sem(arrays, axis=0)\n",
    "    std = np.std(arrays, axis=0)\n",
    "\n",
    "    spec = hlp.get_variant_spec(var)\n",
    "    # display(Markdown(f'## <center>{spec.name}</center>'))\n",
    "    # display(Markdown(f'### <center>{spec.desc}: Folds: {n_folds}</center>'))\n",
    "    sem_df = pd.DataFrame(index=mean_df.index, columns=mean_df.columns)\n",
    "    sem_df_styler = sem_df.style.set_table_attributes(\"style='display:inline'\").set_caption('Standard Error of Mean')\n",
    "    \n",
    "    for r in range(mean_df.shape[0]):\n",
    "        for c in range(mean_df.shape[1]):\n",
    "            sem_df.iloc[r, c] = f'{mean_df.iloc[r, c]:.2f} $\\pm$ {sem[r, c]:.2f}'\n",
    "    \n",
    "    std_df = pd.DataFrame(index=mean_df.index, columns=mean_df.columns)\n",
    "    std_df_styler = std_df.style.set_table_attributes(\"style='display:inline'\").set_caption('Standard Deviation')\n",
    "    for r in range(mean_df.shape[0]):\n",
    "        for c in range(mean_df.shape[1]):\n",
    "            std_df.iloc[r, c] = f'{mean_df.iloc[r, c]:.2f} $\\pm$ {std[r, c]:.2f}'\n",
    "    \n",
    "    return sem_df['F1-Score'], std_df['F1-Score']\n",
    "    \n",
    "display(Markdown('# <center>F1-Score All</center>'))\n",
    "display(Markdown('---'))\n",
    "\n",
    "variants = [\n",
    "    # ('p001-01', ['0001'], 10),\n",
    "    # ('p001-02', ['0001'], 10),\n",
    "    # ('p001-03', ['0001'], 10),\n",
    "    # ('p007-02', ['0001'], 10),\n",
    "    # ('p008-02', ['0001'], 10),\n",
    "    ('p009-02', ['0002'], 10),\n",
    "]\n",
    "\n",
    "iterations = [\n",
    "    ('1', '230718-01'),\n",
    "    ('2', '230718-02'),\n",
    "    ('3', '230718-03'),\n",
    "    ('4', '230718-04'),\n",
    "    ('5', '230718-05')\n",
    "]\n",
    "\n",
    "# columns=[hlp.get_variant_spec(v[0]).name for v in variants]\n",
    "columns = [idx for idx, _ in iterations]\n",
    "df_sem, df_std = pd.DataFrame(columns=columns), pd.DataFrame(columns=columns)\n",
    "for variant, samples, folds in variants:\n",
    "    for idx, name in iterations:\n",
    "        df_m, df_sd = show(variant, name, samples, n_folds=folds)\n",
    "        # df_sem[hlp.get_variant_spec(variant).name] = df_m\n",
    "        # df_std[hlp.get_variant_spec(variant).name] = df_sd\n",
    "        df_sem[str(idx)] = df_m\n",
    "        df_std[str(idx)] = df_sd\n",
    "    \n",
    "# df_sem.style.highlight_max(color='lightgreen', axis=0)\n",
    "# display(Markdown('### With Standard Error of Mean'))\n",
    "# display(df_sem)\n",
    "\n",
    "# display(Markdown('### With Standard Deviation'))\n",
    "# df_std.style.format(':.2f').to_latex(caption='SD', hrules=True)\n",
    "# display(df_std)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c54ab1f1-2b9d-4260-96b3-89a90ed8b176",
   "metadata": {},
   "outputs": [],
   "source": [
    "def make_ave_table(var: str, run_id: str, samples: ty.List[str], n_folds: int = 10):\n",
    "    exp_root = data_root / run_id\n",
    "    def mk_table(fold) -> pd.DataFrame:\n",
    "        return hlp.make_table(exp_root, samples, var, all_rounds, fold)\n",
    "    tables = [mk_table(fold + 1) for fold in range(n_folds)]\n",
    "    arrays = [df.to_numpy() for df in tables]\n",
    "    mean_df = ph.mean_df(tables)\n",
    "    return mean_df['F1-Score']\n",
    "\n",
    "all_df = pd.DataFrame()\n",
    "for idx, iter in iterations:\n",
    "    mean_df = make_ave_table(\n",
    "        'p009-02', \n",
    "        iter,\n",
    "        samples=['0002'], \n",
    "        n_folds=10)\n",
    "    all_df[idx] = mean_df\n",
    "\n",
    "ave_df, std_df = all_df.mean(axis=1), all_df.std(axis=1)\n",
    "final_df = pd.DataFrame(index=ave_df.index, columns=['$M_{2}^{\"}$'])\n",
    "\n",
    "for r in range(ave_df.shape[0]):\n",
    "    final_df.iloc[r, 0] = f'{ave_df[r]:.2f} $\\pm$ {std_df[r]:.2f}'\n",
    "\n",
    "# print(final_df.to_latex())\n",
    "display(final_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "27dfc755-f866-4846-b240-79497ea77b38",
   "metadata": {},
   "outputs": [],
   "source": [
    "# display(multi_mean_df.mean(axis=1))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8243bc55-d15f-4083-9109-c2dc4d732079",
   "metadata": {},
   "source": [
    "[<< All Reports](http://pods.evl.uic.edu/eegl/230510/main.html)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "52cc5ebf-193f-462d-895e-5b68bb930465",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(multi_mean_df.std(axis=1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "700246ad-8cea-464d-ab9f-12df4de97a71",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
