{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "\n",
    "import numpy as np\n",
    "from numpy.core.multiarray import result_type\n",
    "import sys\n",
    "\n",
    "code_path = '/home/ec2-user/PycharmProjects/facility_location_with_predictions'\n",
    "if code_path not in sys.path:\n",
    "    sys.path.append(code_path)\n",
    "\n",
    "from run_experiments import run_experiment\n",
    "from itertools import product\n",
    "import polars as pl\n",
    "import multiprocessing as mp\n",
    "import numpy as np\n",
    "import pickle"
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Set Parameters."
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "code",
   "source": [
    "\n",
    "num_trials = 300\n",
    "num_elems = 100\n",
    "num_sets = 10000\n",
    "fp_rates = [0.0, 0.005, 0.02]\n",
    "fn_rates = [0.0, 0.15, 0.3]\n",
    "connection_probability=0.02"
   ],
   "metadata": {
    "collapsed": false
   },
   "execution_count": null,
   "outputs": []
  },
  {
   "cell_type": "markdown",
   "source": [
    "Run experiment to get a dataframe of results."
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "outputs": [],
   "source": [
    "df_list = []\n",
    "num_proc = 20\n",
    "with mp.Pool(num_proc) as pool:\n",
    "    result_obj_dict = {}\n",
    "    for fp, fn in product(fp_rates, fn_rates):\n",
    "        result_obj_dict[(fp, fn)] = []\n",
    "        for trail_num in range(num_trials):\n",
    "            result_obj_dict[(fp, fn)].append(pool.apply_async(\n",
    "                run_experiment_ab_prediction,\n",
    "                kwds={'seed': trail_num,\n",
    "                      'false_neg_rate': fn,\n",
    "                      'false_pos_rate': fp,\n",
    "                      'num_elems': num_elems,\n",
    "                      'num_sets': num_sets,\n",
    "                      'connection_probability' : connection_probability}\n",
    "            ))\n",
    "\n",
    "    # print (result_obj_dict)\n",
    "    i = 0\n",
    "    for rate_pair, result_obj_list in result_obj_dict.items():\n",
    "        fp_rate, fn_rate = rate_pair\n",
    "        for result_obj in result_obj_list:\n",
    "            df_list.append(result_obj.get().select([\n",
    "                pl.lit(fp_rate).alias('fp rate'),\n",
    "                pl.lit(fn_rate).alias('fn rate'),\n",
    "                pl.all()\n",
    "            ]))\n",
    "            print(i)\n",
    "            i += 1\n",
    "result_df = pl.concat(df_list)\n",
    "\n",
    "\n",
    "\n"
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "markdown",
   "source": [
    "Write results to pickle."
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "outputs": [],
   "source": [
    "with open(f'all_results_exp1_{num_sets}_{num_elems}_{connection_probability}.pkl', 'wb') as f:\n",
    "    pickle.dump(result_df, f)"
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "markdown",
   "source": [
    "# Analysis"
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "markdown",
   "source": [
    "Load results from pickle."
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "outputs": [],
   "source": [
    "with open(f'all_results_exp1_{num_sets}_{num_elems}_{connection_probability}.pkl', 'rb') as f:\n",
    "    result_df = pickle.load(f)\n",
    "print(result_df)"
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "markdown",
   "source": [
    "Calculate competitive ratio, and get mean and standard deviation."
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "outputs": [],
   "source": [
    "comp_ratio_cols = ['general online comp ratio',\n",
    "                   'prediction online comp ratio',\n",
    "                   'standard combination comp ratio',\n",
    "                   'smooth combination comp ratio']\n",
    "grouped_df_expectation_of_ratio = result_df.select([\n",
    "    pl.col('fp rate'),\n",
    "    pl.col('fn rate'),\n",
    "    (pl.col('general online') / pl.col('offline')).alias('general online comp ratio'),\n",
    "    (pl.col('prediction online') / pl.col('offline')).alias('prediction online comp ratio'),\n",
    "    (pl.col('standard combination') / pl.col('offline')).alias('standard combination comp ratio'),\n",
    "    (pl.col('smooth combination') / pl.col('offline')).alias('smooth combination comp ratio')\n",
    "]).groupby(['fp rate', 'fn rate']).agg(\n",
    "    [pl.format('{} ({})',\n",
    "               pl.col(name).mean().apply(lambda x: f'{x:.3f}'),\n",
    "               pl.col(name).std().apply(lambda x: f'{x:.3f}')) for name in comp_ratio_cols]\n",
    ").sort(['fp rate', 'fn rate'])\n",
    "grouped_df_expectation_of_ratio"
   ],
   "metadata": {
    "collapsed": false
   }
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "outputs": [],
   "source": [
    "latex_table = grouped_df_expectation_of_ratio.select([\n",
    "    'fp rate',\n",
    "    'fn rate',\n",
    "    'general online comp ratio',\n",
    "    'prediction online comp ratio',\n",
    "    'standard combination comp ratio',\n",
    "    'smooth combination comp ratio'\n",
    "])\n",
    "\n",
    "print(latex_table.select(pl.all()).to_pandas().to_latex(index=False, column_format='cccccc'))"
   ],
   "metadata": {
    "collapsed": false
   }
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "2.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 0
}
