{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "71dc7768",
   "metadata": {},
   "source": [
    "# Parking Permit Problem Experiments\n",
    "In this notebook, we empirically test our online algorithms for the Parking Permit Problem (PPP) using New York City Weather Data from between 1869 and 2022 (dataset: https://www.kaggle.com/datasets/danbraswell/new-york-city-weather-18692022?resource=download)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bacaccc6",
   "metadata": {},
   "outputs": [],
   "source": [
    "# load necessary libraries\n",
    "\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from tqdm import tqdm\n",
    "from src.ParkingPermitProblem import DualAugmentedSolver, OnlineDeterministicSolver, OnlineRandomizedSolver"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ced88331",
   "metadata": {},
   "outputs": [],
   "source": [
    "# load NYC Central Park Weather Data\n",
    "\n",
    "data = pd.read_csv(\"data/NYC_Central_Park_Weather.csv\")\n",
    "data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8b12734c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# add column indicating whether it rained that day\n",
    "\n",
    "data['RAINED'] = (data['PRCP'] > 0.0).astype(int)\n",
    "data.head()\n",
    "\n",
    "# add YEAR, MONTH, DAY columns and remove leap days and incomplete year 2022\n",
    "\n",
    "data['YEAR'] = pd.to_datetime(data['DATE']).dt.year\n",
    "data['MONTH'] = pd.to_datetime(data['DATE']).dt.month\n",
    "data['DAY'] = pd.to_datetime(data['DATE']).dt.day\n",
    "data = data[~((data['MONTH'] == 2) & (data['DAY'] == 29))] # remove leap days\n",
    "data = data[~((data['YEAR'] == 2022))] # remove incomplete year 2022"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "85adef54",
   "metadata": {},
   "outputs": [],
   "source": [
    "# process data into yearly instances for PPP\n",
    "\n",
    "T = 365\n",
    "num_years = int(len(data)/T)  # check number of years\n",
    "\n",
    "all_data = np.zeros((num_years, T), dtype=int)\n",
    "\n",
    "for year in range(num_years):\n",
    "    yearly_data = data.iloc[year*T:(year+1)*T]\n",
    "    all_data[year, :] = yearly_data['RAINED'].values\n",
    "\n",
    "all_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a3f5d5de",
   "metadata": {},
   "outputs": [],
   "source": [
    "# parameters for PPP instance\n",
    "num_permits = 9\n",
    "cost_discount = 1.1 # discount factor for permit costs\n",
    "\n",
    "\n",
    "durations = np.array([int(2**i) for i in range(num_permits)])  # costs of permits\n",
    "costs = np.array([(2 / cost_discount)**i for i in range(num_permits)])\n",
    "\n",
    "def get_dual_predictions(all_data, costs, durations):\n",
    "    num_years, T = all_data.shape\n",
    "\n",
    "    dual_predictions = np.zeros((num_years, T), dtype=float)\n",
    "    solverAugmented = DualAugmentedSolver(alpha=0.5)\n",
    "    solverAugmented.setPermitTypes(costs, durations)\n",
    "\n",
    "    for year in range(num_years):\n",
    "\n",
    "        request_sequence = all_data[year, :]\n",
    "        solverAugmented.setInstance(request_sequence)\n",
    "        _, dual_vars, _ = solverAugmented.calculateOptimalCostLaminar()\n",
    "        dual_predictions[year, : ] = dual_vars\n",
    "\n",
    "    return np.mean(dual_predictions, axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4b9eb183",
   "metadata": {},
   "outputs": [],
   "source": [
    "def threeRatios(costs, durations, training_data, instance, alpha=0.5):\n",
    "    solverAugmented = DualAugmentedSolver(alpha)\n",
    "    solverAugmented.setPermitTypes(costs, durations)\n",
    "\n",
    "    optimal_dual = get_dual_predictions(training_data, costs, durations)\n",
    "    solverAugmented.setDualPredictions(optimal_dual)\n",
    "    solverAugmented.setInstance(instance)\n",
    "    ratio_augmented = solverAugmented.competitiveRatioNonLaminar()\n",
    "\n",
    "    solverDeterministic = OnlineDeterministicSolver()\n",
    "    solverDeterministic.setPermitTypes(costs, durations)\n",
    "    solverDeterministic.setInstance(instance)\n",
    "    ratio_deterministic = solverDeterministic.competitiveRatioNonLaminar()\n",
    "\n",
    "    solverRandomized = OnlineRandomizedSolver()\n",
    "    solverRandomized.setPermitTypes(costs, durations)\n",
    "    solverRandomized.setInstance(instance)\n",
    "    ratio_randomized = solverRandomized.competitiveRatioNonLaminar()\n",
    "\n",
    "    return ratio_augmented, ratio_deterministic, ratio_randomized\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "60542029",
   "metadata": {},
   "outputs": [],
   "source": [
    "# experiment involving varying n factor, over all test samples\n",
    "\n",
    "n = np.arange(2, 10)\n",
    "ratios_augmented = np.zeros(len(n))\n",
    "ratios_deterministic = np.zeros(len(n))\n",
    "ratios_randomized = np.zeros(len(n))\n",
    "\n",
    "num_years = all_data.shape[0]\n",
    "\n",
    "augmented_competitive_ratios = np.zeros((len(n), num_years))\n",
    "deterministic_competitive_ratios = np.zeros((len(n), num_years))\n",
    "randomized_competitive_ratios = np.zeros((len(n), num_years))\n",
    "\n",
    "for idx, num_permits in tqdm(enumerate(n)):\n",
    "    # parameters for PPP instance\n",
    "\n",
    "    cost_discount = 1.5 # discount factor for permit costs\n",
    "    durations = np.array([int(2**i) for i in range(num_permits)])  # costs of permits\n",
    "    costs = np.array([(2 / cost_discount)**i for i in range(num_permits)])\n",
    "\n",
    "    for test_sample in tqdm(range(num_years)):\n",
    "        instance = all_data[test_sample, :]\n",
    "        training_data = np.delete(all_data, test_sample, axis=0)\n",
    "\n",
    "        ratio_augmented, ratio_deterministic, ratio_randomized = \\\n",
    "            threeRatios(costs, durations, training_data, instance, alpha=0.5)\n",
    "\n",
    "        augmented_competitive_ratios[idx, test_sample] = ratio_augmented\n",
    "        deterministic_competitive_ratios[idx, test_sample] = ratio_deterministic\n",
    "        randomized_competitive_ratios[idx, test_sample] = ratio_randomized\n",
    "    ratios_augmented[idx] = np.mean(augmented_competitive_ratios[idx, :])\n",
    "    ratios_deterministic[idx] = np.mean(deterministic_competitive_ratios[idx, :])\n",
    "    ratios_randomized[idx] = np.mean(randomized_competitive_ratios[idx, :])\n",
    "np.save(f\"all_competitive_ratios_varying_n_discount_{cost_discount}_all_samples_augmented.npy\", augmented_competitive_ratios)\n",
    "np.save(f\"all_competitive_ratios_varying_n_discount_{cost_discount}_all_samples_deterministic.npy\", deterministic_competitive_ratios)\n",
    "np.save(f\"all_competitive_ratios_varying_n_discount_{cost_discount}_all_samples_randomized.npy\", randomized_competitive_ratios)\n",
    "\n",
    "plt.plot(n, ratios_augmented, label='Augmented Algorithm', marker='o')\n",
    "plt.plot(n, ratios_deterministic, label='Deterministic Algorithm', marker='x')\n",
    "plt.plot(n, ratios_randomized, label='Randomized Algorithm', marker='s')\n",
    "plt.xlabel('Number of Permit Types (n)')\n",
    "plt.ylabel('Competitive Ratio')\n",
    "plt.legend()\n",
    "plt.title('Competitive Ratios of Different Algorithms vs Number of Permit Types')\n",
    "plt.savefig(f'competitive_ratios_varying_n_discount_{cost_discount}_all_samples.png')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "890dbbf5",
   "metadata": {},
   "outputs": [],
   "source": [
    "cost_discount = 1.5\n",
    "\n",
    "augmented_competitive_ratios = np.load(f\"all_competitive_ratios_varying_n_discount_{cost_discount}_all_samples_augmented.npy\")\n",
    "deterministic_competitive_ratios = np.load(f\"all_competitive_ratios_varying_n_discount_{cost_discount}_all_samples_deterministic.npy\")\n",
    "randomized_competitive_ratios = np.load(f\"all_competitive_ratios_varying_n_discount_{cost_discount}_all_samples_randomized.npy\")\n",
    "\n",
    "augmented_means = np.mean(augmented_competitive_ratios, axis=1)\n",
    "deterministic_means = np.mean(deterministic_competitive_ratios, axis=1)\n",
    "randomized_means = np.mean(randomized_competitive_ratios, axis=1)\n",
    "\n",
    "augmented_std = np.std(augmented_competitive_ratios, axis=1)*1.96/np.sqrt(num_years)\n",
    "deterministic_std = np.std(deterministic_competitive_ratios, axis=1)*1.96/np.sqrt(num_years)\n",
    "randomized_std = np.std(randomized_competitive_ratios, axis=1)*1.96/np.sqrt(num_years)\n",
    "\n",
    "n = np.arange(2, 10)\n",
    "\n",
    "plt.plot(n, augmented_means, label='Augmented Algorithm', marker='o')\n",
    "plt.plot(n, deterministic_means, label='Deterministic Algorithm', marker='x')\n",
    "plt.plot(n, randomized_means, label='Randomized Algorithm', marker='s')\n",
    "plt.fill_between(n, augmented_means - augmented_std, augmented_means + augmented_std, alpha=0.2)\n",
    "plt.fill_between(n, deterministic_means - deterministic_std, deterministic_means + deterministic_std, alpha=0.2)\n",
    "plt.fill_between(n, randomized_means - randomized_std, randomized_means + randomized_std, alpha=0.2)\n",
    "plt.xlabel('Number of Permit Types', fontsize=16)\n",
    "plt.ylabel('Competitive Ratio', fontsize=16)\n",
    "plt.xticks(fontsize=14)\n",
    "plt.yticks(fontsize=14)\n",
    "plt.yticks(fontsize=14)\n",
    "plt.legend(fontsize=14)\n",
    "\n",
    "\n",
    "plt.savefig(f'competitive_ratios_varying_n_discount_{cost_discount}_all_samples.png')\n",
    "\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "63580246",
   "metadata": {},
   "outputs": [],
   "source": [
    "# do experiment with varying cost discount factor, over all test samples\n",
    "cost_discounts = np.arange(1.05, 2.0, 0.05)\n",
    "ratios_augmented = np.zeros(len(cost_discounts))\n",
    "ratios_deterministic = np.zeros(len(cost_discounts))\n",
    "ratios_randomized = np.zeros(len(cost_discounts))\n",
    "\n",
    "num_permits = 9\n",
    "\n",
    "num_years = all_data.shape[0]\n",
    "\n",
    "augmented_competitive_ratios = np.zeros((len(cost_discounts), num_years))\n",
    "deterministic_competitive_ratios = np.zeros((len(cost_discounts), num_years))\n",
    "randomized_competitive_ratios = np.zeros((len(cost_discounts), num_years))\n",
    "\n",
    "print(augmented_competitive_ratios.shape)\n",
    "\n",
    "\n",
    "for idx, cost_discount in enumerate(cost_discounts):\n",
    "\n",
    "    # parameters for PPP instance\n",
    "    durations = np.array([int(2**i) for i in range(num_permits)])  # costs of permits\n",
    "    costs = np.array([(2 / cost_discount)**i for i in range(num_permits)])\n",
    "\n",
    "\n",
    "    for test_sample in range(num_years):\n",
    "        instance = all_data[test_sample, :]\n",
    "        training_data = np.delete(all_data, test_sample, axis=0)\n",
    "        \n",
    "        augmented_competitive_ratios[idx, test_sample], deterministic_competitive_ratios[idx, test_sample], randomized_competitive_ratios[idx, test_sample] = \\\n",
    "            threeRatios(costs, durations, training_data, instance, alpha=0.5)\n",
    "\n",
    "    ratios_augmented[idx] = np.mean(augmented_competitive_ratios[idx, :])\n",
    "    ratios_deterministic[idx] = np.mean(deterministic_competitive_ratios[idx, :])\n",
    "    ratios_randomized[idx] = np.mean(randomized_competitive_ratios[idx, :])\n",
    "\n",
    "np.save(f\"all_competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples_augmented.npy\", augmented_competitive_ratios)\n",
    "np.save(f\"all_competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples_deterministic.npy\", deterministic_competitive_ratios)\n",
    "np.save(f\"all_competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples_randomized.npy\", randomized_competitive_ratios)\n",
    "\n",
    "plt.plot(cost_discounts, ratios_augmented, label='Augmented Algorithm', marker='o')\n",
    "plt.plot(cost_discounts, ratios_deterministic, label='Deterministic Algorithm', marker='x')\n",
    "plt.plot(cost_discounts, ratios_randomized, label='Randomized Algorithm', marker='s')\n",
    "plt.xlabel('Cost Discount Factor')\n",
    "plt.ylabel('Competitive Ratio')\n",
    "plt.legend()\n",
    "plt.title('Competitive Ratios of Different Algorithms vs Cost Discount Factor')\n",
    "plt.savefig(f'competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples.png')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3a4ed3ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "num_permits = 9\n",
    "cost_discounts = np.arange(1.05, 2.0, 0.05)\n",
    "num_years = all_data.shape[0]\n",
    "\n",
    "\n",
    "augmented_competitive_ratios = np.load(f\"all_competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples_augmented.npy\")\n",
    "deterministic_competitive_ratios = np.load(f\"all_competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples_deterministic.npy\")\n",
    "randomized_competitive_ratios = np.load(f\"all_competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples_randomized.npy\")\n",
    "\n",
    "augmented_means = np.mean(augmented_competitive_ratios, axis=1)\n",
    "deterministic_means = np.mean(deterministic_competitive_ratios, axis=1)\n",
    "randomized_means = np.mean(randomized_competitive_ratios, axis=1)\n",
    "\n",
    "augmented_std = np.std(augmented_competitive_ratios, axis=1)/np.sqrt(num_years)*1.96\n",
    "deterministic_std = np.std(deterministic_competitive_ratios, axis=1)/np.sqrt(num_years)*1.96\n",
    "randomized_std = np.std(randomized_competitive_ratios, axis=1)/np.sqrt(num_years)*1.96\n",
    "\n",
    "\n",
    "plt.plot(cost_discounts, augmented_means, label='Augmented Algorithm', marker='o')\n",
    "plt.plot(cost_discounts, deterministic_means, label='Deterministic Algorithm', marker='x')\n",
    "plt.plot(cost_discounts, randomized_means, label='Randomized Algorithm', marker='s')\n",
    "plt.fill_between(cost_discounts, augmented_means - augmented_std, augmented_means + augmented_std, alpha=0.2)\n",
    "plt.fill_between(cost_discounts, deterministic_means - deterministic_std, deterministic_means + deterministic_std, alpha=0.2)\n",
    "plt.fill_between(cost_discounts, randomized_means - randomized_std, randomized_means + randomized_std, alpha=0.2)\n",
    "plt.xlabel('Discount Factor', fontsize=16)\n",
    "plt.ylabel('Competitive Ratio', fontsize=16)\n",
    "plt.xticks(fontsize=14)\n",
    "plt.yticks(fontsize=14)\n",
    "plt.yticks(fontsize=14)\n",
    "plt.legend(fontsize=14, loc=\"upper left\", framealpha=0.0)\n",
    "plt.savefig(f'competitive_ratios_varying_cost_discount_n_{num_permits}_all_samples.png')\n",
    "\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "dual-predictions",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
