{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Train agents"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "path_base = \"runs/table_results\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import subprocess\n",
    "\n",
    "# Create each script by appending the unique part to the base script\n",
    "shared_hyperparameters = [\"--env-id\", \"TradingEnv-v0\", \"--save-model\", \"--n-quantiles\", \"200\", \"--total-timesteps\", \"1000000\", \"--dir\", path_base]\n",
    "\n",
    "base_script1 = [\"python\", \"qrdqn.py\"] + shared_hyperparameters\n",
    "base_script2 = [\"python\", \"qrcvar.py\"] + shared_hyperparameters\n",
    "base_script3 = [\"python\", \"qricvar.py\"] + shared_hyperparameters\n",
    "base_script4 = [\"python\", \"qrsrm.py\"] + shared_hyperparameters\n",
    "\n",
    "scripts1 = [base_script1]\n",
    "scripts2 = [base_script2 + [\"--alpha\", alpha] for alpha in [\"0.2\", \"0.5\", \"1.0\"]]\n",
    "scripts3 = [base_script3 + [\"--alpha\", alpha] for alpha in [\"0.2\", \"0.5\"]]\n",
    "scripts4 = [base_script4 + [\"--risk-measure\", \"CVaR\", \"--alpha\", alpha] for alpha in [\"0.2\", \"0.5\", \"1.0\"]]  \n",
    "scripts5 = [base_script4 + [\"--risk-measure\", \"Exp\", \"--alpha\", alpha] for alpha in [\"4\"]]\n",
    "scripts6 = [base_script4 + [\"--risk-measure\", \"Dual\", \"--alpha\", alpha] for alpha in [\"2\"]]\n",
    "scripts7 = [base_script4 + [\"--risk-measure\", \"WSCVaR\", \"--alphas\", \"0.1,0.6,1.0\", \"--weights\", \"0.2,0.3,0.5\"]]\n",
    "scripts8 = [base_script4 + [\"--risk-measure\", \"WSCVaR\", \"--alphas\", \"0.2,1.0\", \"--weights\", \"0.5,0.5\"]]\n",
    "\n",
    "scripts = scripts1 + scripts2 + scripts3 + scripts4 + scripts5 + scripts6 + scripts7 + scripts8\n",
    "\n",
    "seeds = [\"1\", \"2\", \"3\", \"4\", \"5\"]\n",
    "scripts = [script + [\"--seed\", seed] for script in scripts for seed in seeds]\n",
    "# Run each script\n",
    "for script in scripts:\n",
    "    print(f\"Running script {script}...\")\n",
    "    try:\n",
    "        subprocess.run(script, check=True)\n",
    "    except subprocess.CalledProcessError:\n",
    "        print(f\"Script {script} failed!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Run the simulations"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import run_simulation_from_dir, add_columns, make_agent_hue_kws\n",
    "from utils import AGENT_NAME_MAP, AGG_RISK_VALUES\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import os\n",
    "os.environ[\"KMP_DUPLICATE_LIB_OK\"]=\"TRUE\"\n",
    "\n",
    "import warnings\n",
    "warnings.filterwarnings('ignore', category=UserWarning)\n",
    "warnings.filterwarnings('ignore', category=DeprecationWarning)\n",
    "warnings.filterwarnings('ignore', category=RuntimeWarning)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "Nsimulations = 10000\n",
    "sim_seed = 6\n",
    "pkl_path = path_base+\"/df_exp.pkl\"\n",
    "if \"df_exp.pkl\" not in os.listdir(path_base):\n",
    "    df_exp = run_simulation_from_dir(path_base + \"/\", Nsimulations=Nsimulations, sim_seed=sim_seed)\n",
    "    df_exp.to_pickle(pkl_path)\n",
    "\n",
    "df_exp = pd.read_pickle(pkl_path)\n",
    "df_exp = df_exp.pipe(add_columns)\n",
    "df_exp = df_exp.sort_values(by=['agent', 'risk_measure', 'alpha', 'n_quantile', 'environment_name', 'agent_seed']).reset_index(drop=True)\n",
    "print(df_exp.shape)\n",
    "df_exp.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Results"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "index_columns=['agent', 'risk_measure', 'alpha', 'sim_seed', 'Model', 'agent_seed']\n",
    "columns=['rewards']\n",
    "\n",
    "df_grouped = df_exp.groupby(index_columns)[columns].agg(AGG_RISK_VALUES)\n",
    "\n",
    "\n",
    "# Drop 'rewards' level from columns\n",
    "df_grouped.columns = df_grouped.columns.droplevel(0)\n",
    "df_grouped.index = df_grouped.index.droplevel([0,1,2,3])\n",
    "df_grouped = df_grouped.reset_index()\n",
    "df_grouped.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Calculate mean and std separately\n",
    "mean_df = df_grouped.groupby(['Model']).mean()\n",
    "std_df = df_grouped.groupby(['Model']).std()\n",
    "mean_df.drop(columns=['agent_seed'], inplace=True)\n",
    "std_df.drop(columns=['agent_seed'], inplace=True)\n",
    "# Create a new DataFrame with the same structure as mean_df\n",
    "result_df = mean_df.copy()\n",
    "\n",
    "# For each column in the DataFrame, format the values as \"mean ± std\"\n",
    "for col in result_df.columns:\n",
    "    result_df[col] = mean_df[col].map(\"{:.2f}\".format) + \"±\" + std_df[col].map(\"{:.2f}\".format)\n",
    "\n",
    "result_df.reset_index(inplace=True)\n",
    "result_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_models = ['QR-SRM($\\\\alpha$=1.0)', \n",
    "                 'QR-CVaR($\\\\alpha$=1.0)',\n",
    "                 'QR-DQN', \n",
    "                 'QR-SRM($\\\\alpha$=0.5)', \n",
    "                 'QR-CVaR($\\\\alpha$=0.5)', \n",
    "                 'QR-iCVaR($\\\\alpha$=0.5)',\n",
    "                 'QR-SRM($\\\\alpha$=0.2)',                                \n",
    "                 'QR-CVaR($\\\\alpha$=0.2)',                                                   \n",
    "                 'QR-iCVaR($\\\\alpha$=0.2)', \n",
    "                 'QR-SRM($\\\\lambda$=4.0)',\n",
    "                 'QR-SRM($\\\\nu$=2.0)',\n",
    "                 'QR-SRM($\\\\alpha$=0.1,0.6,1.0)',\n",
    "                 'QR-SRM($\\\\alpha$=0.2,1.0)']\n",
    "\n",
    "chosen_columns = ['Model', '$\\operatorname{CVaR}_{1.0}$', '$\\operatorname{CVaR}_{0.5}$', '$\\operatorname{CVaR}_{0.2}$', '$\\operatorname{ERM}_{4.0}$', '$\\operatorname{DPRM}_{2.0}$', '$\\operatorname{WSCVaR}_{0.1,0.6,1.0}$', '$\\operatorname{WSCVaR}_{0.2,1.0}_{0.5,0.5}$']\n",
    "\n",
    "result_df_ordered = result_df[result_df['Model'].isin(chosen_models)].reset_index(drop=True)\n",
    "result_df_ordered['Model'] = pd.Categorical(result_df_ordered['Model'], categories=chosen_models, ordered=True)\n",
    "result_df_ordered = result_df_ordered[chosen_columns]\n",
    "\n",
    "# Sort by the 'Model' column\n",
    "result_df_ordered = result_df_ordered.sort_values('Model')\n",
    "\n",
    "# Reset the index\n",
    "result_df_ordered = result_df_ordered.reset_index(drop=True)\n",
    "\n",
    "result_df_ordered"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "result_df_ordered.to_latex(path_base + \"/result_df.tex\", column_format='|l|ccccccc|', escape=False, index=False)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "CleanRL",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
