{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "69746215",
   "metadata": {},
   "source": [
    "## Table Aggregation: BGP Synthesis Time\n",
    "\n",
    "In this notebook we aggregate the raw data into tables on BGP/OSPF synthesis time as used in our figures"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "22dcb06c",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "def get_neural_files(basedir): return dict([[int(f.split(\"-\")[2]), basedir + f] for f in os.listdir(basedir) if f.startswith(\"bgp-reqs\")])\n",
    "neural_files = get_neural_files(\"results/\")\n",
    "nc_files = dict([[int(f.split(\"-\")[2][:-len(\"result\")]), \"./netcomplete/results/\" + f] for f in os.listdir(\"./netcomplete/results/\") if f.startswith(\"bgp-reqs\")])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "09d2a39c",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "29c0f457",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "                 time  num_timeouts  samples  min_nodes  max_nodes\n",
      "bucket                                                            \n",
      "0 Small     18.072854             0        8          0          7\n",
      "1 Medium    60.864079             0        8          8         15\n",
      "2 Large   1389.484829             7        8         16         23\n"
     ]
    }
   ],
   "source": [
    "TIMEOUT_VALUE = 999\n",
    "\n",
    "def read_results_file(f, with_consistency=False):\n",
    "    df = pd.read_csv(f, sep=\";\", names=[\"prefix\", \"time\"] + ([\"consistency\"] if with_consistency else []))\n",
    "    \n",
    "    df[\"num_nodes\"] = [int(p[len(\"bgp-n\"):]) for p in df[\"prefix\"].values]\n",
    "    num_samples_per_category = 8\n",
    "    \n",
    "    def bucket(n):\n",
    "        if n < num_samples_per_category: return \"0 Small\"\n",
    "        if n < num_samples_per_category*2: return \"1 Medium\"\n",
    "        return \"2 Large\"\n",
    "    df[\"bucket\"] = [bucket(n) for n in df[\"num_nodes\"]]\n",
    "    \n",
    "    df_with_timeouts = pd.DataFrame(df)\n",
    "    df_with_timeouts[\"num_timeouts\"] = df[\"time\"].values == TIMEOUT_VALUE\n",
    "    \n",
    "    #df = df[df[\"time\"] != 999]\n",
    "    df[\"time\"] = (df[\"time\"] == TIMEOUT_VALUE) * 1500 + (df[\"time\"] != TIMEOUT_VALUE) * df[\"time\"]\n",
    "    \n",
    "    if with_consistency:\n",
    "        df[\"full_match\"] = df[\"consistency\"].values == 1.0\n",
    "    \n",
    "    counts = df.groupby(\"bucket\").count()[\"num_nodes\"]\n",
    "    res = df.groupby(\"bucket\").mean()\n",
    "    del res[\"num_nodes\"]\n",
    "    res[\"samples\"] = counts\n",
    "    res[\"min_nodes\"] = df.groupby(\"bucket\").min()[\"num_nodes\"]\n",
    "    res[\"max_nodes\"] = df.groupby(\"bucket\").max()[\"num_nodes\"]\n",
    "    res[\"num_timeouts\"] = df_with_timeouts.groupby(\"bucket\").sum()[\"num_timeouts\"]\n",
    "    \n",
    "    return res\n",
    "#print(read_results_file(\"bgp/neural/bgp-reqs-2-result-bgp-2021-09-15_11:25:18.csv\", with_consistency=True))\n",
    "print(read_results_file(nc_files[2]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "a7ec01d3",
   "metadata": {},
   "outputs": [],
   "source": [
    "system_name = \"Neural\"\n",
    "consistency_col = \"Consistency (Neural)\"\n",
    "full_match_col = \"Full Match (Neural)\"\n",
    "\n",
    "def merge(df_netcomplete, df_neural):\n",
    "    res = pd.DataFrame(df_netcomplete)\n",
    "        \n",
    "    res[\"NetComplete\"] = df_netcomplete[\"time\"]\n",
    "    res[\"NetComplete Timeouts\"] = df_netcomplete[\"num_timeouts\"]\n",
    "    res[system_name] = df_neural[\"time\"]\n",
    "    res[consistency_col] = df_neural[\"consistency\"]\n",
    "    res[full_match_col] = df_neural[\"full_match\"]\n",
    "    del res[\"time\"]\n",
    "    \n",
    "    speedup_factors = res[\"NetComplete\"].values / res[system_name].values\n",
    "    res[\"Speedup\"] = [\"%.1fx\" % f for f in speedup_factors]\n",
    "    \n",
    "    res = res.reset_index()\n",
    "    \n",
    "    return res[[\"bucket\", \"NetComplete\", \"Neural\", \"Speedup\", \"NetComplete Timeouts\", consistency_col, full_match_col]]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "053df4c0",
   "metadata": {},
   "source": [
    "## 2 Requirements"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "4a7bb5b8",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>bucket</th>\n",
       "      <th>NetComplete</th>\n",
       "      <th>Neural</th>\n",
       "      <th>Speedup</th>\n",
       "      <th>NetComplete Timeouts</th>\n",
       "      <th>Consistency (Neural)</th>\n",
       "      <th>Full Match (Neural)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0 Small</td>\n",
       "      <td>18.072854</td>\n",
       "      <td>0.640729</td>\n",
       "      <td>28.2x</td>\n",
       "      <td>0</td>\n",
       "      <td>0.968750</td>\n",
       "      <td>0.875</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1 Medium</td>\n",
       "      <td>60.864079</td>\n",
       "      <td>2.747783</td>\n",
       "      <td>22.2x</td>\n",
       "      <td>0</td>\n",
       "      <td>0.939236</td>\n",
       "      <td>0.750</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2 Large</td>\n",
       "      <td>1389.484829</td>\n",
       "      <td>22.300895</td>\n",
       "      <td>62.3x</td>\n",
       "      <td>7</td>\n",
       "      <td>0.988636</td>\n",
       "      <td>0.875</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     bucket  NetComplete     Neural Speedup  NetComplete Timeouts  \\\n",
       "0   0 Small    18.072854   0.640729   28.2x                     0   \n",
       "1  1 Medium    60.864079   2.747783   22.2x                     0   \n",
       "2   2 Large  1389.484829  22.300895   62.3x                     7   \n",
       "\n",
       "   Consistency (Neural)  Full Match (Neural)  \n",
       "0              0.968750                0.875  \n",
       "1              0.939236                0.750  \n",
       "2              0.988636                0.875  "
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "req2 = merge(\n",
    "    read_results_file(nc_files[2]),\n",
    "    read_results_file(neural_files[2], with_consistency=True),\n",
    ")\n",
    "req2"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "460d886b",
   "metadata": {},
   "source": [
    "## 8 Requirements"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "6c7b6ee1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>bucket</th>\n",
       "      <th>NetComplete</th>\n",
       "      <th>Neural</th>\n",
       "      <th>Speedup</th>\n",
       "      <th>NetComplete Timeouts</th>\n",
       "      <th>Consistency (Neural)</th>\n",
       "      <th>Full Match (Neural)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0 Small</td>\n",
       "      <td>247.690651</td>\n",
       "      <td>1.065172</td>\n",
       "      <td>232.5x</td>\n",
       "      <td>0</td>\n",
       "      <td>0.960000</td>\n",
       "      <td>0.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1 Medium</td>\n",
       "      <td>1500.000000</td>\n",
       "      <td>3.470269</td>\n",
       "      <td>432.2x</td>\n",
       "      <td>8</td>\n",
       "      <td>0.967839</td>\n",
       "      <td>0.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2 Large</td>\n",
       "      <td>1500.000000</td>\n",
       "      <td>30.961408</td>\n",
       "      <td>48.4x</td>\n",
       "      <td>8</td>\n",
       "      <td>0.969444</td>\n",
       "      <td>0.75</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     bucket  NetComplete     Neural Speedup  NetComplete Timeouts  \\\n",
       "0   0 Small   247.690651   1.065172  232.5x                     0   \n",
       "1  1 Medium  1500.000000   3.470269  432.2x                     8   \n",
       "2   2 Large  1500.000000  30.961408   48.4x                     8   \n",
       "\n",
       "   Consistency (Neural)  Full Match (Neural)  \n",
       "0              0.960000                 0.75  \n",
       "1              0.967839                 0.50  \n",
       "2              0.969444                 0.75  "
      ]
     },
     "execution_count": 32,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "req8 = merge(\n",
    "    read_results_file(nc_files[8]),\n",
    "    read_results_file(neural_files[8], with_consistency=True),\n",
    ")\n",
    "req8"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c5c70c33",
   "metadata": {},
   "source": [
    "## 16 Requirements"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "33b30719",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>bucket</th>\n",
       "      <th>NetComplete</th>\n",
       "      <th>Neural</th>\n",
       "      <th>Speedup</th>\n",
       "      <th>NetComplete Timeouts</th>\n",
       "      <th>Consistency (Neural)</th>\n",
       "      <th>Full Match (Neural)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0 Small</td>\n",
       "      <td>1416.828196</td>\n",
       "      <td>2.527836</td>\n",
       "      <td>560.5x</td>\n",
       "      <td>7</td>\n",
       "      <td>0.925770</td>\n",
       "      <td>0.25</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1 Medium</td>\n",
       "      <td>1500.000000</td>\n",
       "      <td>5.481253</td>\n",
       "      <td>273.7x</td>\n",
       "      <td>8</td>\n",
       "      <td>0.947115</td>\n",
       "      <td>0.25</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2 Large</td>\n",
       "      <td>1500.000000</td>\n",
       "      <td>69.092142</td>\n",
       "      <td>21.7x</td>\n",
       "      <td>8</td>\n",
       "      <td>0.958699</td>\n",
       "      <td>0.25</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     bucket  NetComplete     Neural Speedup  NetComplete Timeouts  \\\n",
       "0   0 Small  1416.828196   2.527836  560.5x                     7   \n",
       "1  1 Medium  1500.000000   5.481253  273.7x                     8   \n",
       "2   2 Large  1500.000000  69.092142   21.7x                     8   \n",
       "\n",
       "   Consistency (Neural)  Full Match (Neural)  \n",
       "0              0.925770                 0.25  \n",
       "1              0.947115                 0.25  \n",
       "2              0.958699                 0.25  "
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "req16 = merge(\n",
    "    read_results_file(nc_files[16]),\n",
    "    read_results_file(neural_files[16], with_consistency=True),\n",
    ")\n",
    "req16"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "68b33c6c",
   "metadata": {},
   "source": [
    "## Format as LaTex table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "0865343f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\midrule\n",
      "2 requirements &Small & 18.073s & \\textbf{0.641s} & 28.2x & 0.969 & 0.875\\\\\n",
      " &Medium & 60.864s & \\textbf{2.748s} & 22.2x & 0.939 & 0.75\\\\\n",
      " &Large & 1389.485s\\tiny{  7/8 TO} & \\textbf{22.301s} & 62.3x & 0.989 & 0.875\\\\\n",
      "\\midrule\n",
      "8 requirements &Small & 247.691s & \\textbf{1.065s} & 232.5x & 0.96 & 0.75\\\\\n",
      " &Medium & 1500s\\tiny{  8/8 TO} & \\textbf{3.47s} & 432.2x & 0.968 & 0.5\\\\\n",
      " &Large & 1500s\\tiny{  8/8 TO} & \\textbf{30.961s} & 48.4x & 0.969 & 0.75\\\\\n",
      "\\midrule\n",
      "16 requirements &Small & 1416.828s\\tiny{  7/8 TO} & \\textbf{2.528s} & 560.5x & 0.926 & 0.25\\\\\n",
      " &Medium & 1500s\\tiny{  8/8 TO} & \\textbf{5.481s} & 273.7x & 0.947 & 0.25\\\\\n",
      " &Large & 1500s\\tiny{  8/8 TO} & \\textbf{69.092s} & 21.7x & 0.959 & 0.25\\\\\n"
     ]
    }
   ],
   "source": [
    "import numpy as np\n",
    "\n",
    "reqs_counts = [2, 8, 16]\n",
    "\n",
    "for nreqs, reqs in zip(reqs_counts, [req2, req8, req16]):\n",
    "    print(\"\\\\midrule\")\n",
    "    for i, row in enumerate(reqs.iloc):\n",
    "        row = list(row.values)\n",
    "        num_timeouts = row[4]\n",
    "        del row[4]\n",
    "        def str_v(v, i):\n",
    "            if v == \"0 Small\": return \"Small\"\n",
    "            if v == \"1 Medium\": return \"Medium\"\n",
    "            if v == \"2 Large\": return \"Large\"\n",
    "            if type(v) is np.float64:\n",
    "                highlighted_indices = set([2])\n",
    "                res = \"\"\n",
    "                if i in highlighted_indices: res += \"\\\\textbf{\"\n",
    "                res += (\"%.3f\" % v).rstrip(\"0\").rstrip(\".\")\n",
    "                if i == 1 or i == 2: res += \"s\"\n",
    "                if i in highlighted_indices: res += \"}\"\n",
    "                \n",
    "                if i == 1: # NetComplete Time\n",
    "                    if num_timeouts > 0:\n",
    "                        res += \"\\\\tiny{\" + \"  {}/8 TO\".format(num_timeouts) + \"}\"\n",
    "                return res\n",
    "            else: return str(v)\n",
    "        row_values = [str_v(v, i) for i,v in enumerate(row)]\n",
    "            \n",
    "        prefix = \" &\"\n",
    "        if i == 0: prefix = \"{} requirements &\".format(nreqs)\n",
    "        print(prefix + \" & \".join(row_values) + \"\\\\\\\\\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bbd79feb",
   "metadata": {},
   "source": [
    "## GPU"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "4d7a3410",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\midrule\n",
      "2 requirements &Small & 18.073s & \\textbf{0.496s} & 36.4x & 0.969 & 0.875\\\\\n",
      " &Medium & 60.864s & \\textbf{0.676s} & 90.1x & 0.939 & 0.75\\\\\n",
      " &Large & 1389.485s\\tiny{  7/8 TO} & \\textbf{20.797s} & 66.8x & 0.989 & 0.875\\\\\n",
      "\\midrule\n",
      "8 requirements &Small & 247.691s & \\textbf{0.719s} & 344.7x & 0.96 & 0.75\\\\\n",
      " &Medium & 1500s\\tiny{  8/8 TO} & \\textbf{1.053s} & 1424.3x & 0.968 & 0.5\\\\\n",
      " &Large & 1500s\\tiny{  8/8 TO} & \\textbf{24.728s} & 60.7x & 0.969 & 0.75\\\\\n",
      "\\midrule\n",
      "16 requirements &Small & 1416.828s\\tiny{  7/8 TO} & \\textbf{1.296s} & 1093.0x & 0.922 & 0.125\\\\\n",
      " &Medium & 1500s\\tiny{  8/8 TO} & \\textbf{1.38s} & 1086.6x & 0.945 & 0.125\\\\\n",
      " &Large & 1500s\\tiny{  8/8 TO} & \\textbf{62.778s} & 23.9x & 0.963 & 0.25\\\\\n"
     ]
    }
   ],
   "source": [
    "neural_gpu_files = get_neural_files(\"./results/bgp-gpu/\")\n",
    "\n",
    "req2_gpu = merge(\n",
    "    read_results_file(nc_files[2]),\n",
    "    read_results_file(neural_gpu_files[2], with_consistency=True),\n",
    ")\n",
    "req8_gpu = merge(\n",
    "    read_results_file(nc_files[8]),\n",
    "    read_results_file(neural_gpu_files[8], with_consistency=True),\n",
    ")\n",
    "req16_gpu = merge(\n",
    "    read_results_file(nc_files[16]),\n",
    "    read_results_file(neural_gpu_files[16], with_consistency=True),\n",
    ")\n",
    "\n",
    "import numpy as np\n",
    "\n",
    "reqs_counts = [2, 8, 16]\n",
    "\n",
    "for nreqs, reqs in zip(reqs_counts, [req2_gpu, req8_gpu, req16_gpu]):\n",
    "    print(\"\\\\midrule\")\n",
    "    for i, row in enumerate(reqs.iloc):\n",
    "        row = list(row.values)\n",
    "        num_timeouts = row[4]\n",
    "        del row[4]\n",
    "        def str_v(v, i):\n",
    "            if v == \"0 Small\": return \"Small\"\n",
    "            if v == \"1 Medium\": return \"Medium\"\n",
    "            if v == \"2 Large\": return \"Large\"\n",
    "            if type(v) is np.float64:\n",
    "                highlighted_indices = set([2])\n",
    "                res = \"\"\n",
    "                if i in highlighted_indices: res += \"\\\\textbf{\"\n",
    "                res += (\"%.3f\" % v).rstrip(\"0\").rstrip(\".\")\n",
    "                if i == 1 or i == 2: res += \"s\"\n",
    "                if i in highlighted_indices: res += \"}\"\n",
    "                \n",
    "                if i == 1: # NetComplete Time\n",
    "                    if num_timeouts > 0:\n",
    "                        res += \"\\\\tiny{\" + \"  {}/8 TO\".format(num_timeouts) + \"}\"\n",
    "                return res\n",
    "            else: return str(v)\n",
    "        row_values = [str_v(v, i) for i,v in enumerate(row)]\n",
    "            \n",
    "        prefix = \" &\"\n",
    "        if i == 0: prefix = \"{} requirements &\".format(nreqs)\n",
    "        print(prefix + \" & \".join(row_values) + \"\\\\\\\\\")"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
