{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "69fc18ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e88292d6",
   "metadata": {},
   "outputs": [],
   "source": [
    "datasets = [\"barbell\", \"community\", \"erdosrenyi\", \"Ring\", \"Sensor\",\"torus\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5e77dfc4",
   "metadata": {},
   "outputs": [],
   "source": [
    "all_dfs = []\n",
    "path = \"../src/autoencoder/\"\n",
    "for dataset in datasets:\n",
    "    file_path = f\"{path}{dataset}_result.csv\"\n",
    "    df = pd.read_csv(file_path, header=None)\n",
    "    col = df.iloc[:,1]\n",
    "    df_nw = col.str.split(\" \\+\\- \", expand=True)\n",
    "    df_nw.columns = [\"mean\", \"std\"]\n",
    "    df_nw[\"method\"] = df.iloc[:,0]\n",
    "    df_nw = df_nw.iloc[[(m in ['DiffPool',\n",
    " 'MinCut',\n",
    " 'NMF',\n",
    " 'TopK',\n",
    " 'SAGPool',\n",
    " 'NDP',\n",
    " 'Graclus',\n",
    " 'SPREAD_EDGE_diffusion_distance']) for m in df_nw[\"method\"]],:]\n",
    "    all_dfs.append(df_nw)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c608def9",
   "metadata": {},
   "outputs": [],
   "source": [
    "all_dfs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fa9941ba",
   "metadata": {},
   "outputs": [],
   "source": [
    "this_order = ['SPREAD_EDGE_diffusion_distance', 'NDP',\n",
    " 'Graclus',\n",
    " 'NMF',\n",
    " 'TopK',\n",
    " 'SAGPool',\n",
    " 'DiffPool',\n",
    " 'MinCut'\n",
    " ]\n",
    "for df in all_dfs:\n",
    "    df[\"mean\"] = df[\"mean\"].astype(float).map(lambda x: f\"{x:.2e}\")\n",
    "    df[\"std\"] = df[\"std\"].astype(float).map(lambda x: f\"{x:.2e}\")\n",
    "    df[\"method\"] = pd.Categorical(df[\"method\"], categories=this_order, ordered=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "df2214c6",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "combined_df = pd.concat(all_dfs, keys=datasets, names=['dataset', 'row']).reset_index(level='dataset')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4076597b",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "combined_df[\"mean_and_std\"] = combined_df[\"mean\"] + \" ± \" + combined_df[\"std\"].astype(str)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8295df13",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "combined_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9412e84d",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "pivot_df = combined_df[[\"mean_and_std\", \"method\", \"dataset\"]]\n",
    "pivot_df = pivot_df.pivot(index=\"dataset\", columns=\"method\", values=\"mean_and_std\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "582ffcb8",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "pivot_df.T.to_csv(\"../plots/combined_ae_results.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "889f40f6",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "pivot_df = combined_df[[\"mean\", \"method\", \"dataset\"]]\n",
    "pivot_df = pivot_df.pivot(index=\"dataset\", columns=\"method\", values=\"mean\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7ac2ab31",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "ranks = pivot_df.T\n",
    "ranks = ranks.to_numpy()\n",
    "ranks = pd.DataFrame(ranks, index=pivot_df.columns, columns=pivot_df.index)\n",
    "ranks = ranks.rank(axis=0, ascending=False)\n",
    "ranks.mean(axis=1).round(2)#.values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "ranks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7832a003",
   "metadata": {
    "vscode": {
     "languageId": "javascript"
    }
   },
   "outputs": [],
   "source": [
    "pivot_df.T"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": ".venv",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
