{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Train agents"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "path_base = \"runs/put_option\"\n",
    "alphas = [\"0.4\", \"0.6\", \"0.8\", \"1.0\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import subprocess\n",
    "\n",
    "base_script = [\"python\", \"qrsrm.py\", \"--env-id\", \"AmericanOptionEnv-v0\", \"--save-model\", \"--n-quantiles\", \"50\", \"--total-timesteps\", \"1000000\", \"--gamma\", \"0.99\", \"--dir\", path_base, \"--risk-measure\", \"CVaR\"]\n",
    "\n",
    "scripts = [base_script + [\"--alpha\", alpha] for alpha in alphas]\n",
    "\n",
    "# Run each script\n",
    "for script in scripts:\n",
    "    print(f\"Running script {script}...\")\n",
    "    try:\n",
    "        subprocess.run(script, check=True)\n",
    "    except subprocess.CalledProcessError:\n",
    "        print(f\"Script {script} failed!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Run the simulations"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import run_simulation_from_dir, add_columns, make_agent_hue_kws\n",
    "from utils import AGENT_NAME_MAP\n",
    "from utils import plot_policy, option_execution_policy\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import os\n",
    "os.environ[\"KMP_DUPLICATE_LIB_OK\"]=\"TRUE\"\n",
    "\n",
    "import warnings\n",
    "warnings.filterwarnings(action='ignore', category=UserWarning)\n",
    "warnings.filterwarnings('ignore', category=DeprecationWarning)\n",
    "warnings.filterwarnings('ignore', category=RuntimeWarning)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "Nsimulations = 10000\n",
    "sim_seed = 1\n",
    "pkl_path = path_base + \"/df_exp.pkl\"\n",
    "if \"df_exp.pkl\" not in os.listdir(path_base):\n",
    "    df_exp = run_simulation_from_dir(path_base + \"/\", Nsimulations=Nsimulations, sim_seed=sim_seed)\n",
    "    df_exp.to_pickle(pkl_path)\n",
    "\n",
    "df_exp = pd.read_pickle(pkl_path)\n",
    "df_exp.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_exp = df_exp.pipe(add_columns)\n",
    "df = df_exp.sort_values(by=['agent', 'risk_measure', 'alpha', 'n_quantile', 'environment_name', 'agent_seed']).reset_index(drop=True)\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Plot the figures"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "from IPython import display\n",
    "%matplotlib inline\n",
    "\n",
    "from matplotlib import ticker\n",
    "from matplotlib import rcParams\n",
    "\n",
    "import seaborn as sns\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "backend_format = \"retina\"  # @param [\"retina\", \"\"]\n",
    "%config InlineBackend.figure_format = backend_format\n",
    "\n",
    "sns.set_context(\"notebook\")\n",
    "sns.set_style(\"ticks\")\n",
    "\n",
    "rcParams['ytick.right'] = True\n",
    "rcParams['axes.autolimit_mode'] = 'round_numbers'\n",
    "rcParams['axes.xmargin'] = 0\n",
    "rcParams['axes.ymargin'] = 0\n",
    "\n",
    "rcParams['figure.figsize'] = [8, 5]\n",
    "rcParams['figure.dpi'] = 150\n",
    "\n",
    "rcParams['pdf.fonttype'] = 42\n",
    "rcParams['ps.fonttype'] = 42\n",
    "\n",
    "colors = sns.color_palette(n_colors=10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "index_columns=['agent', 'risk_measure', 'alpha', 'sim_seed', 'Model']\n",
    "columns=['rewards']\n",
    "\n",
    "\n",
    "def cvar0(group):\n",
    "    # Perform some operation on the group\n",
    "    r_values = group.values\n",
    "    result = np.mean(r_values[r_values < np.quantile(r_values, 0.4)])\n",
    "    return result\n",
    "\n",
    "def cvar1(group):\n",
    "    # Perform some operation on the group\n",
    "    r_values = group.values\n",
    "    result = np.mean(r_values[r_values < np.quantile(r_values, 0.6)])\n",
    "    return result\n",
    "\n",
    "def cvar2(group):\n",
    "    # Perform some operation on the group\n",
    "    r_values = group.values\n",
    "    result = np.mean(r_values[r_values < np.quantile(r_values, 0.8)])\n",
    "    return result\n",
    "\n",
    "def cvar3(group):\n",
    "    # Perform some operation on the group\n",
    "    r_values = group.values\n",
    "    result = np.mean(r_values[r_values < np.quantile(r_values, 1.0)])\n",
    "    return result\n",
    "\n",
    "df_grouped = df.groupby(index_columns)[columns].agg([\n",
    "    (r\"$\\operatorname{CVaR}_{0.4}$\", cvar0),\n",
    "    (r\"$\\operatorname{CVaR}_{0.6}$\", cvar1),\n",
    "    (r\"$\\operatorname{CVaR}_{0.8}$\", cvar2),\n",
    "    (r\"$\\operatorname{CVaR}_{1.0}$\", cvar3),\n",
    "])\n",
    "\n",
    "\n",
    "# Drop 'rewards' level from columns\n",
    "df_grouped.columns = df_grouped.columns.droplevel(0)\n",
    "df_grouped.index = df_grouped.index.droplevel([0,1,2,3])\n",
    "df_grouped"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "alphas = [\"0.4\", \"0.6\", \"0.8\", \"1.0\"]\n",
    "agent_id_ordered_by_performance = [\"qrsrm_\" + alpha for alpha in alphas]\n",
    "\n",
    "experiments_ordered_by_performance = [dict(agent_id=agent_id,\n",
    "                                           agent_name=f\"{AGENT_NAME_MAP[agent_id.split('_')[0]]}(\" + r\"$\\alpha$=\" +  f\"{agent_id.split('_')[1]})\",\n",
    "                                           color=colors[i]) \n",
    "                                           for i, agent_id in enumerate(agent_id_ordered_by_performance)]\n",
    "\n",
    "agent_names, hue_kws = make_agent_hue_kws(experiments_ordered_by_performance)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, ax = plt.subplots(figsize=(8, 5))\n",
    "\n",
    "sns.histplot(data=df, \n",
    "             x=\"rewards\", \n",
    "             hue=\"Model\", \n",
    "             stat=\"density\", \n",
    "             common_norm=False, \n",
    "             alpha=0.4,\n",
    "             bins=200, \n",
    "             kde=True,\n",
    "             hue_order=agent_names,\n",
    "             palette=colors,\n",
    "             legend='brief',\n",
    "             ax=ax,\n",
    "    )\n",
    "    \n",
    "\n",
    "# Add vertical lines\n",
    "line_styles = ['dotted', 'dotted', 'dashed', 'solid'] # 'dotted', 'dotted', 'dashed', \n",
    "# Add vertical lines\n",
    "for agent, value in df_grouped.iterrows():\n",
    "    for i, v in enumerate(value):\n",
    "        ax.vlines(x=v, \n",
    "                  ymin=0, \n",
    "                  ymax=4, \n",
    "                  colors=hue_kws['color'][agent_names.index(agent)], \n",
    "                  linestyles=line_styles[i],\n",
    "                  alpha=1,\n",
    "                  linewidth=1,\n",
    "                  )\n",
    "    \n",
    "ax.set_title('')\n",
    "ax.spines['right'].set_visible(True)\n",
    "ax.spines['top'].set_visible(True)\n",
    "ax.spines['left'].set_visible(True)\n",
    "ax.spines['bottom'].set_visible(True)\n",
    "ax.set_xlabel('Option Payoff')\n",
    "ax.set_ylabel('Density')\n",
    "ax.set_xlim([0, 0.7])\n",
    "ax.set_ylim([0, 4])\n",
    "\n",
    "# Get the existing legend\n",
    "legend = ax.get_legend()\n",
    "\n",
    "# Modify the legend\n",
    "legend.set_title('')\n",
    "legend.set_frame_on(False)\n",
    "# move to upper left\n",
    "\n",
    "plt.setp(legend.get_lines(), linewidth=3, alpha=0.5)\n",
    "\n",
    "fig.set_facecolor('white')\n",
    "fig.tight_layout()\n",
    "\n",
    "plt.savefig(path_base + '/comparison_put_option.pdf', transparent=True)\n",
    "plt.savefig(path_base + '/comparison_put_option.eps', format='eps', dpi=1200)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "pkl_path = path_base + \"/execution_s_df.pkl\"\n",
    "if \"execution_s_df.pkl\" not in os.listdir(path_base):\n",
    "    execution_s_df = option_execution_policy(path_base + \"/\", s_res=801)\n",
    "    execution_s_df = execution_s_df.pipe(add_columns)\n",
    "    execution_s_df.to_pickle(pkl_path)\n",
    "execution_s_df2 = pd.read_pickle(pkl_path)\n",
    "execution_s_df2.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, ax = plt.subplots(figsize=(8, 5))\n",
    "\n",
    "sns.lineplot(data=execution_s_df, \n",
    "             x=\"index\",\n",
    "             y=\"execution_s\", \n",
    "             hue=\"Model\",\n",
    "             hue_order=agent_names,\n",
    "             palette=colors,\n",
    "             legend='brief',\n",
    "             ax=ax,\n",
    "             zorder=1,\n",
    "    )\n",
    "    \n",
    "    \n",
    "ax.set_title('')\n",
    "ax.spines['right'].set_visible(True)\n",
    "ax.spines['top'].set_visible(True)\n",
    "ax.spines['left'].set_visible(True)\n",
    "ax.spines['bottom'].set_visible(True)\n",
    "ax.set_xlabel('Time')\n",
    "ax.set_ylabel('Underlying Asset Price')\n",
    "#ax.set_xlim([0, 0.7])\n",
    "ax.set_ylim([0.5, 1.3])\n",
    "\n",
    "ax.hlines(y=1.0, xmin=0, xmax=10, colors='black', linestyles='dashed', linewidth=1, alpha=0.5, zorder=0)\n",
    "\n",
    "ax.yaxis.set_major_locator(ticker.MaxNLocator(nbins=10))\n",
    "ax.xaxis.set_major_locator(ticker.MaxNLocator(nbins=10))\n",
    "\n",
    "legend = ax.legend(loc='upper left', title='', frameon=False)\n",
    "plt.setp(legend.get_lines(), linewidth=3, alpha=0.5)\n",
    "\n",
    "fig.set_facecolor('white')\n",
    "fig.tight_layout()\n",
    "\n",
    "plt.savefig(path_base + '/comparison_put_option_policy.pdf', transparent=True)\n",
    "plt.savefig(path_base + '/comparison_put_option_policy.eps', format='eps', dpi=1200)\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "CleanRL",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
