{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "62863503-060b-48b8-b769-bddb194a074d",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "from glob import glob\n",
    "from scipy import stats"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "0a11c8b9-5e73-44ba-a158-91b05aea2326",
   "metadata": {},
   "outputs": [],
   "source": [
    "eps = [0.125, 2.0, 8.0]\n",
    "N = [12,24,36,48,60,72,84,96,108,120]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "541c14b8-1109-4fe1-bd28-9bc15c495dd1",
   "metadata": {},
   "outputs": [],
   "source": [
    "def computeCI(data_list, alpha=0.05):\n",
    "    '''\n",
    "    This function computes the 100*(1-alpha)% Confidence Interval for the true mean based\n",
    "    on n observations given a list.\n",
    "    '''\n",
    "    # Convert list to numpy array\n",
    "    data = np.array(data_list)\n",
    "    n = len(data)\n",
    "    \n",
    "    # Calculate mean and standard error\n",
    "    mean = np.mean(data)\n",
    "    std = np.std(data, ddof=1)  # Sample std (using Bessel's correction with ddof=1)\n",
    "    se = std / np.sqrt(n)\n",
    "    \n",
    "    # Calculate confidence interval using t-distribution\n",
    "    df = n - 1\n",
    "    t_critical = stats.t.ppf(1 - alpha/2, df)\n",
    "    margin = t_critical * se\n",
    "    \n",
    "    return mean, margin"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "60881d3e-a342-48d8-850a-ca9d82b0e637",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "EPSILON 0.125 - Initial: 8.65e-02 pm 8.18e-03 Optimized: 1.55e-02 pm 9.72e-04 Benchmark: 1.62e-02 pm 5.34e-03\n",
      "Relative Error Reduction: 82.09 %\n",
      "Average Running Time: 20.6 min.\n",
      "EPSILON 2.0 - Initial: 8.76e-02 pm 8.63e-03 Optimized: 1.29e-02 pm 1.20e-03 Benchmark: 1.24e-02 pm 2.69e-03\n",
      "Relative Error Reduction: 85.26 %\n",
      "Average Running Time: 26.7 min.\n",
      "EPSILON 8.0 - Initial: 9.09e-02 pm 4.39e-03 Optimized: 1.13e-02 pm 1.33e-03 Benchmark: 1.16e-02 pm 2.26e-03\n",
      "Relative Error Reduction: 87.53 %\n",
      "Average Running Time: 26.1 min.\n"
     ]
    }
   ],
   "source": [
    "# Table 3 - error with N=120\n",
    "for ep in eps:\n",
    "    InitialModel_relativeOODerror = []\n",
    "    OptimizedModel_relativeOODerror = []\n",
    "    benchmark_relativeOODerror = []\n",
    "    times = []\n",
    "    for k in range(10):\n",
    "        df = pd.read_csv(f'training_log_eps{ep}N{120}/training_log_{k}.csv')\n",
    "        InitialModel_relativeOODerror.append(np.sqrt(df['Relative_OOD_Error'][0]))\n",
    "        OptimizedModel_relativeOODerror.append(np.sqrt(df['Relative_OOD_Error'].iloc[-1]))\n",
    "        benchmark_relativeOODerror.append(np.sqrt(df['Relative_Benchmark_OOD'][0]))\n",
    "        times.append(df['Time (s)'].iloc[-1])\n",
    "    init_mean, init_margin = computeCI(InitialModel_relativeOODerror)\n",
    "    op_mean, op_margin = computeCI(OptimizedModel_relativeOODerror)\n",
    "    bench_mean, bench_margin = computeCI(benchmark_relativeOODerror)\n",
    "    time_mean, _ = computeCI(times)\n",
    "    print(f'EPSILON {ep} - Initial: {init_mean:.2e} pm {init_margin:.2e}',\n",
    "          f'Optimized: {op_mean:.2e} pm {op_margin:.2e}',\n",
    "          f'Benchmark: {bench_mean:.2e} pm {bench_margin:.2e}')\n",
    "    print('Relative Error Reduction:',round(100*(init_mean - op_mean)/init_mean,2),'%')\n",
    "    print('Average Running Time:',round(time_mean/60,1), \"min.\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "59fb7041-bd62-4cdc-a4c2-ceac7d4a331e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total Compute Time: 27 hrs\n"
     ]
    }
   ],
   "source": [
    "# Total experiment runtime\n",
    "# The epsilon experiments ran in parallel with \n",
    "# epsilon=2 taking the longest taking 27 hours\n",
    "total_compute_time = 0\n",
    "for n in N:\n",
    "    times = []\n",
    "    for k in range(10):\n",
    "        df = pd.read_csv(f'training_log_eps{eps[1]}N{n}/training_log_{k}.csv')\n",
    "        times.append(df['Time (s)'].iloc[-1])\n",
    "    total_compute_time += sum(times)\n",
    "print('Total Compute Time:', round(total_compute_time/3600), 'hrs')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "aea36e9c-0221-47fa-ae43-34bbc93c90ec",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
