{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import json\n",
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "import pandas as pd\n",
    "from collections import defaultdict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Global font sizes for axes titles and axis labels.\n",
    "# An earlier `load_plot_setting()` helper (seaborn-v0_8-talk style with\n",
    "# xx-large axis labels) is no longer used; the `plots` directory is\n",
    "# created by `setup()` below instead.\n",
    "plt.rcParams[\"axes.titlesize\"] = \"x-large\"\n",
    "plt.rcParams[\"axes.labelsize\"] = \"x-large\"\n",
    "\n",
    "def setup():\n",
    "    \"\"\"Create the ``plots`` directory and build the per-method line styles.\n",
    "\n",
    "    Returns:\n",
    "        dict: maps a method key (``retraining``, ``mmt``, ``bmt``,\n",
    "        ``standalone``, ``greedy``) to a dict of keyword arguments holding\n",
    "        ``label``, ``color``, ``linewidth`` and, for every method except\n",
    "        ``greedy``, ``linestyle``.\n",
    "    \"\"\"\n",
    "    os.makedirs(\"plots\", exist_ok=True)\n",
    "\n",
    "    # (method key, legend label, colour, explicit linestyle or None)\n",
    "    rows = [\n",
    "        (\"retraining\", \"RfS\", \"tab:blue\", \"-\"),\n",
    "        (\"mmt\", \"MMT\", \"tab:green\", \"-\"),\n",
    "        (\"bmt\", \"BMT\", \"goldenrod\", \"-\"),\n",
    "        (\"standalone\", \"Standalone\", \"tab:red\", \"-\"),\n",
    "        (\"greedy\", \"Greedy\", \"tab:orange\", None),\n",
    "    ]\n",
    "\n",
    "    styles = {}\n",
    "    for key, label, color, linestyle in rows:\n",
    "        entry = {\"label\": label}\n",
    "        # Only store a linestyle when one was given explicitly.\n",
    "        if linestyle is not None:\n",
    "            entry[\"linestyle\"] = linestyle\n",
    "        entry[\"color\"] = color\n",
    "        entry[\"linewidth\"] = 3\n",
    "        styles[key] = entry\n",
    "    return styles\n",
    "\n",
    "# Build the style table once; the plotting cell looks methods up in `plot_styles`.\n",
    "plot_styles = setup() "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### MNIST heterogeneity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def prepare_data(\n",
    "    diff_p=(1.0, 0.5, 0.01),\n",
    "    diff_seeds=(1, 2, 3),\n",
    "    unlearn_methods=(\"retraining\", \"bmt\", \"mmt\"),\n",
    "    root_dir=\"../main_results/data_heterogeneity/heterogeneity_new\",\n",
    "):\n",
    "    \"\"\"Load per-seed ``stats.json`` files and aggregate them across seeds.\n",
    "\n",
    "    For every value ``p`` and every method, reads\n",
    "    ``{root_dir}/seed-{seed}/niid-{p}/{method}/stats.json`` for each seed,\n",
    "    aligns the runs by row position and computes the per-row mean and\n",
    "    standard deviation across seeds.\n",
    "\n",
    "    Args:\n",
    "        diff_p: values substituted into the ``niid-{p}`` path component.\n",
    "        diff_seeds: seeds substituted into the ``seed-{seed}`` path component.\n",
    "        unlearn_methods: method directory names to load.\n",
    "        root_dir: directory that contains the ``seed-*`` folders.\n",
    "\n",
    "    Returns:\n",
    "        dict: ``data[p][method]`` is ``{\"mean\": DataFrame, \"std\": DataFrame}``,\n",
    "        both indexed by row position (index name ``\"index\"``).\n",
    "\n",
    "    Raises:\n",
    "        FileNotFoundError: if an expected ``stats.json`` does not exist.\n",
    "    \"\"\"\n",
    "    data = {}\n",
    "\n",
    "    for p in diff_p:\n",
    "        # aggregate results across different seeds\n",
    "        outputs = {}\n",
    "        for method in unlearn_methods:\n",
    "            runs = []\n",
    "            for seed in diff_seeds:\n",
    "                path = f\"{root_dir}/seed-{seed}/niid-{p}/{method}/stats.json\"\n",
    "                print(f\"Loading stats from {path}\")\n",
    "                # Close the handle promptly instead of leaving it to the garbage collector.\n",
    "                with open(path, \"r\") as fh:\n",
    "                    stats = pd.DataFrame(json.load(fh))  # dataframe for easier aggregation\n",
    "                stats[\"index\"] = range(len(stats))  # row position is the grouping key\n",
    "                runs.append(stats)\n",
    "            grouped = pd.concat(runs).groupby(\"index\")  # same row across different seeds\n",
    "            outputs[method] = {\"mean\": grouped.mean(), \"std\": grouped.std()}\n",
    "\n",
    "        data[p] = outputs\n",
    "\n",
    "    return data\n",
    "\n",
    "# Load every configuration once; the plotting cell iterates over `all_data`.\n",
    "all_data = prepare_data()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def plot(ax, x, mean, std, **kwargs):\n",
    "    \"\"\"Draw a mean curve on ``ax`` with a shaded ``mean - std`` .. ``mean + std`` band.\n",
    "\n",
    "    Args:\n",
    "        ax: object providing ``plot`` and ``fill_between`` (a matplotlib Axes here).\n",
    "        x: x coordinates shared by the curve and the band.\n",
    "        mean: centre line values.\n",
    "        std: half-width of the band around ``mean``.\n",
    "        **kwargs: forwarded unchanged to ``ax.plot``; ``color``, when given,\n",
    "            is also used as the band's face colour.\n",
    "    \"\"\"\n",
    "    ax.plot(x, mean, **kwargs)\n",
    "    lower, upper = mean - std, mean + std\n",
    "    # Without an explicit colour the band receives facecolor=None.\n",
    "    band_color = kwargs[\"color\"] if \"color\" in kwargs else None\n",
    "    ax.fill_between(x, lower, upper, alpha=.4, facecolor=band_color)\n",
    "\n",
    "# One panel per heterogeneity level in `all_data`: each panel shows the mean\n",
    "# test accuracy of every method with a +/- std band, and the figure is saved as a PNG.\n",
    "matplotlib.rcParams.update({'font.size': 16})\n",
    "\n",
    "metrics = \"test_acc\"\n",
    "n_panels = len(all_data)\n",
    "# squeeze=False keeps `axs` two-dimensional, so indexing also works with a single panel.\n",
    "fig, axs = plt.subplots(ncols=n_panels, figsize=(7 * n_panels, 5), squeeze=False)\n",
    "fig.subplots_adjust(wspace=0.25)\n",
    "for i, (p, data) in enumerate(all_data.items()):\n",
    "    ax = axs[0, i]\n",
    "    for method in data:\n",
    "        style = plot_styles[method]\n",
    "        mean = data[method][\"mean\"][metrics]\n",
    "        std = data[method][\"std\"][metrics]\n",
    "        x = mean.index\n",
    "        plot(ax, x, mean, std, markevery=80, **style)\n",
    "\n",
    "    ax.legend(loc=\"lower left\")\n",
    "    ax.set_xlabel(\"Communication Rounds\", labelpad=15)\n",
    "    ax.set_ylabel(\"Test Accuracy\", labelpad=15)\n",
    "    ax.set_title(r\"$\\rho$\" + f\"={p}\")\n",
    "    ax.set_ylim(50, 95)\n",
    "\n",
    "fig.tight_layout()\n",
    "figure_name = \"outputs/mnist_heterogeneity.png\"\n",
    "# savefig does not create missing directories, and setup() only creates `plots`.\n",
    "os.makedirs(os.path.dirname(figure_name), exist_ok=True)\n",
    "plt.savefig(figure_name, bbox_inches=\"tight\", dpi=300)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "unlearning",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
