{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import fnmatch\n",
    "from itertools import chain"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib.ticker as ticker\n",
    "import scienceplots\n",
    "plt.style.use('science')\n",
    "import torch\n",
    "import torch.nn.functional as F\n",
    "from py_vollib_vectorized import vectorized_black_scholes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "resources = None"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "def load_csv(path, error):\n",
    "    df = pd.concat([pd.read_csv(f\"{path}/{f}\") for f in os.listdir(path) if fnmatch.fnmatch(f, f'{error}*.csv')])\n",
    "    df['quote_datetime'] = pd.to_datetime(df['quote_datetime'])\n",
    "    df = df.set_index('quote_datetime').sort_index()\n",
    "    return df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 89,
   "metadata": {},
   "outputs": [],
   "source": [
    "path_svi = \"../benchmark/store/9457192\"\n",
    "path_opds = \"../eval/store/9457504 (raw)\"\n",
    "path_opds = \"../eval/store/9457504 (finetune)\"\n",
    "\n",
    "df_svi_rel = load_csv(path_svi, 'rel')\n",
    "df_svi_fit = load_csv(path_svi, 'fit')\n",
    "df_opds_rel = load_csv(path_opds, 'rel')\n",
    "df_opds_fit = load_csv(path_opds, 'fit')\n",
    "df_opds_val = load_csv(path_opds, 'val')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 90,
   "metadata": {},
   "outputs": [],
   "source": [
    "quantiles = [0.01, 0.25, 0.5, 0.75, 0.99]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Train"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>min</th>\n",
       "      <th>%05</th>\n",
       "      <th>%25</th>\n",
       "      <th>%50</th>\n",
       "      <th>%75</th>\n",
       "      <th>%95</th>\n",
       "      <th>max</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>count</th>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mean</th>\n",
       "      <td>0.497253</td>\n",
       "      <td>0.545995</td>\n",
       "      <td>0.000567</td>\n",
       "      <td>0.031151</td>\n",
       "      <td>0.156104</td>\n",
       "      <td>0.341886</td>\n",
       "      <td>0.638248</td>\n",
       "      <td>1.503813</td>\n",
       "      <td>4.717900</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>std</th>\n",
       "      <td>0.648529</td>\n",
       "      <td>1.218018</td>\n",
       "      <td>0.000727</td>\n",
       "      <td>0.027557</td>\n",
       "      <td>0.130315</td>\n",
       "      <td>0.275013</td>\n",
       "      <td>0.520658</td>\n",
       "      <td>2.883747</td>\n",
       "      <td>9.013502</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>min</th>\n",
       "      <td>0.171499</td>\n",
       "      <td>0.177059</td>\n",
       "      <td>0.000002</td>\n",
       "      <td>0.008121</td>\n",
       "      <td>0.042314</td>\n",
       "      <td>0.111040</td>\n",
       "      <td>0.217557</td>\n",
       "      <td>0.460855</td>\n",
       "      <td>1.032091</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1%</th>\n",
       "      <td>0.196420</td>\n",
       "      <td>0.205104</td>\n",
       "      <td>0.000006</td>\n",
       "      <td>0.010379</td>\n",
       "      <td>0.057861</td>\n",
       "      <td>0.127938</td>\n",
       "      <td>0.243217</td>\n",
       "      <td>0.563856</td>\n",
       "      <td>1.585475</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25%</th>\n",
       "      <td>0.277917</td>\n",
       "      <td>0.304651</td>\n",
       "      <td>0.000149</td>\n",
       "      <td>0.016785</td>\n",
       "      <td>0.085211</td>\n",
       "      <td>0.187753</td>\n",
       "      <td>0.355014</td>\n",
       "      <td>0.795932</td>\n",
       "      <td>2.634308</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50%</th>\n",
       "      <td>0.337123</td>\n",
       "      <td>0.390474</td>\n",
       "      <td>0.000351</td>\n",
       "      <td>0.021897</td>\n",
       "      <td>0.105531</td>\n",
       "      <td>0.232626</td>\n",
       "      <td>0.438643</td>\n",
       "      <td>0.993984</td>\n",
       "      <td>3.708775</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>75%</th>\n",
       "      <td>0.586727</td>\n",
       "      <td>0.567431</td>\n",
       "      <td>0.000743</td>\n",
       "      <td>0.038868</td>\n",
       "      <td>0.202520</td>\n",
       "      <td>0.443143</td>\n",
       "      <td>0.794579</td>\n",
       "      <td>1.599452</td>\n",
       "      <td>5.157061</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>99%</th>\n",
       "      <td>1.547546</td>\n",
       "      <td>1.607996</td>\n",
       "      <td>0.003032</td>\n",
       "      <td>0.101382</td>\n",
       "      <td>0.508274</td>\n",
       "      <td>1.061766</td>\n",
       "      <td>1.976541</td>\n",
       "      <td>4.444112</td>\n",
       "      <td>13.638719</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>max</th>\n",
       "      <td>11.852343</td>\n",
       "      <td>23.484888</td>\n",
       "      <td>0.008735</td>\n",
       "      <td>0.419003</td>\n",
       "      <td>1.845117</td>\n",
       "      <td>3.833368</td>\n",
       "      <td>7.078314</td>\n",
       "      <td>55.657773</td>\n",
       "      <td>184.357888</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             mean         std         min         %05         %25         %50  \\\n",
       "count  749.000000  749.000000  749.000000  749.000000  749.000000  749.000000   \n",
       "mean     0.497253    0.545995    0.000567    0.031151    0.156104    0.341886   \n",
       "std      0.648529    1.218018    0.000727    0.027557    0.130315    0.275013   \n",
       "min      0.171499    0.177059    0.000002    0.008121    0.042314    0.111040   \n",
       "1%       0.196420    0.205104    0.000006    0.010379    0.057861    0.127938   \n",
       "25%      0.277917    0.304651    0.000149    0.016785    0.085211    0.187753   \n",
       "50%      0.337123    0.390474    0.000351    0.021897    0.105531    0.232626   \n",
       "75%      0.586727    0.567431    0.000743    0.038868    0.202520    0.443143   \n",
       "99%      1.547546    1.607996    0.003032    0.101382    0.508274    1.061766   \n",
       "max     11.852343   23.484888    0.008735    0.419003    1.845117    3.833368   \n",
       "\n",
       "              %75         %95         max  \n",
       "count  749.000000  749.000000  749.000000  \n",
       "mean     0.638248    1.503813    4.717900  \n",
       "std      0.520658    2.883747    9.013502  \n",
       "min      0.217557    0.460855    1.032091  \n",
       "1%       0.243217    0.563856    1.585475  \n",
       "25%      0.355014    0.795932    2.634308  \n",
       "50%      0.438643    0.993984    3.708775  \n",
       "75%      0.794579    1.599452    5.157061  \n",
       "99%      1.976541    4.444112   13.638719  \n",
       "max      7.078314   55.657773  184.357888  "
      ]
     },
     "execution_count": 91,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_opds_fit.loc[:'2020'].describe(quantiles)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>mean</th>\n",
       "      <th>std</th>\n",
       "      <th>min</th>\n",
       "      <th>%05</th>\n",
       "      <th>%25</th>\n",
       "      <th>%50</th>\n",
       "      <th>%75</th>\n",
       "      <th>%95</th>\n",
       "      <th>max</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>count</th>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>7.490000e+02</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "      <td>749.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mean</th>\n",
       "      <td>1.123616</td>\n",
       "      <td>0.953206</td>\n",
       "      <td>1.524020e-03</td>\n",
       "      <td>0.086536</td>\n",
       "      <td>0.426409</td>\n",
       "      <td>0.919256</td>\n",
       "      <td>1.576387</td>\n",
       "      <td>2.828420</td>\n",
       "      <td>7.978836</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>std</th>\n",
       "      <td>0.876671</td>\n",
       "      <td>0.670179</td>\n",
       "      <td>1.896484e-03</td>\n",
       "      <td>0.073662</td>\n",
       "      <td>0.354180</td>\n",
       "      <td>0.754043</td>\n",
       "      <td>1.278844</td>\n",
       "      <td>2.149121</td>\n",
       "      <td>5.446723</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>min</th>\n",
       "      <td>0.206616</td>\n",
       "      <td>0.253300</td>\n",
       "      <td>6.461361e-07</td>\n",
       "      <td>0.009999</td>\n",
       "      <td>0.061111</td>\n",
       "      <td>0.141491</td>\n",
       "      <td>0.257653</td>\n",
       "      <td>0.585330</td>\n",
       "      <td>1.599859</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1%</th>\n",
       "      <td>0.301428</td>\n",
       "      <td>0.288382</td>\n",
       "      <td>1.789862e-05</td>\n",
       "      <td>0.013114</td>\n",
       "      <td>0.080643</td>\n",
       "      <td>0.187483</td>\n",
       "      <td>0.357677</td>\n",
       "      <td>0.816966</td>\n",
       "      <td>2.283418</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25%</th>\n",
       "      <td>0.492000</td>\n",
       "      <td>0.492095</td>\n",
       "      <td>3.460675e-04</td>\n",
       "      <td>0.033576</td>\n",
       "      <td>0.170079</td>\n",
       "      <td>0.370876</td>\n",
       "      <td>0.655797</td>\n",
       "      <td>1.304297</td>\n",
       "      <td>4.337394</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50%</th>\n",
       "      <td>0.714678</td>\n",
       "      <td>0.650060</td>\n",
       "      <td>9.000705e-04</td>\n",
       "      <td>0.056611</td>\n",
       "      <td>0.272639</td>\n",
       "      <td>0.575738</td>\n",
       "      <td>0.979799</td>\n",
       "      <td>1.867439</td>\n",
       "      <td>6.420889</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>75%</th>\n",
       "      <td>1.645634</td>\n",
       "      <td>1.341944</td>\n",
       "      <td>1.836054e-03</td>\n",
       "      <td>0.116529</td>\n",
       "      <td>0.591144</td>\n",
       "      <td>1.380361</td>\n",
       "      <td>2.360229</td>\n",
       "      <td>4.139196</td>\n",
       "      <td>10.039901</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>99%</th>\n",
       "      <td>3.709171</td>\n",
       "      <td>3.184627</td>\n",
       "      <td>9.419165e-03</td>\n",
       "      <td>0.298912</td>\n",
       "      <td>1.370154</td>\n",
       "      <td>2.986713</td>\n",
       "      <td>5.278008</td>\n",
       "      <td>9.754910</td>\n",
       "      <td>27.578416</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>max</th>\n",
       "      <td>4.782911</td>\n",
       "      <td>3.565918</td>\n",
       "      <td>1.414901e-02</td>\n",
       "      <td>0.408937</td>\n",
       "      <td>1.913362</td>\n",
       "      <td>4.004805</td>\n",
       "      <td>7.354547</td>\n",
       "      <td>10.912838</td>\n",
       "      <td>45.461859</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             mean         std           min         %05         %25  \\\n",
       "count  749.000000  749.000000  7.490000e+02  749.000000  749.000000   \n",
       "mean     1.123616    0.953206  1.524020e-03    0.086536    0.426409   \n",
       "std      0.876671    0.670179  1.896484e-03    0.073662    0.354180   \n",
       "min      0.206616    0.253300  6.461361e-07    0.009999    0.061111   \n",
       "1%       0.301428    0.288382  1.789862e-05    0.013114    0.080643   \n",
       "25%      0.492000    0.492095  3.460675e-04    0.033576    0.170079   \n",
       "50%      0.714678    0.650060  9.000705e-04    0.056611    0.272639   \n",
       "75%      1.645634    1.341944  1.836054e-03    0.116529    0.591144   \n",
       "99%      3.709171    3.184627  9.419165e-03    0.298912    1.370154   \n",
       "max      4.782911    3.565918  1.414901e-02    0.408937    1.913362   \n",
       "\n",
       "              %50         %75         %95         max  \n",
       "count  749.000000  749.000000  749.000000  749.000000  \n",
       "mean     0.919256    1.576387    2.828420    7.978836  \n",
       "std      0.754043    1.278844    2.149121    5.446723  \n",
       "min      0.141491    0.257653    0.585330    1.599859  \n",
       "1%       0.187483    0.357677    0.816966    2.283418  \n",
       "25%      0.370876    0.655797    1.304297    4.337394  \n",
       "50%      0.575738    0.979799    1.867439    6.420889  \n",
       "75%      1.380361    2.360229    4.139196   10.039901  \n",
       "99%      2.986713    5.278008    9.754910   27.578416  \n",
       "max      4.004805    7.354547   10.912838   45.461859  "
      ]
     },
     "execution_count": 92,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_svi_fit.loc[:'2020'].describe(quantiles)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [],
   "source": [
    "opds = pd.concat((df_opds_fit.loc[:'2020':, 'mean'].describe(quantiles), df_opds_fit.loc['2020':, 'mean'].describe(quantiles)), axis=1).T"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "metadata": {},
   "outputs": [],
   "source": [
    "svi = pd.concat((df_svi_fit.loc[:'2020':, 'mean'].describe(quantiles), df_svi_fit.loc['2020':, 'mean'].describe(quantiles)), axis=1).T"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 95,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrrrrr}\n",
      "\\toprule\n",
      " & mean & std & 1% & 25% & 50% & 75% & 99% \\\\\n",
      "\\midrule\n",
      "mean & 1.123616 & 0.876671 & 0.301428 & 0.492000 & 0.714678 & 1.645634 & 3.709171 \\\\\n",
      "mean & 3.382108 & 0.825688 & 1.464073 & 2.827284 & 3.320280 & 3.913583 & 5.247109 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n",
      "\\begin{tabular}{lrrrrrrr}\n",
      "\\toprule\n",
      " & mean & std & 1% & 25% & 50% & 75% & 99% \\\\\n",
      "\\midrule\n",
      "mean & 0.497253 & 0.648529 & 0.196420 & 0.277917 & 0.337123 & 0.586727 & 1.547546 \\\\\n",
      "mean & 1.866320 & 0.574405 & 0.731633 & 1.456644 & 1.826409 & 2.232946 & 3.445215 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    }
   ],
   "source": [
    "cols = ['mean', 'std', '1%', '25%', '50%', '75%', '99%']\n",
    "print(svi[cols].to_latex())\n",
    "print(opds[cols].to_latex())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrrrrr}\n",
      "\\toprule\n",
      " & mean & std & 1% & 25% & 50% & 75% & 99% \\\\\n",
      "\\midrule\n",
      "mean & 0.009300 & 0.006654 & 0.003333 & 0.005818 & 0.008569 & 0.011010 & 0.021351 \\\\\n",
      "mean & 0.007496 & 0.001694 & 0.003690 & 0.006591 & 0.007478 & 0.008376 & 0.011817 \\\\\n",
      "\\bottomrule\n",
      "\\end{tabular}\n",
      "\n"
     ]
    }
   ],
   "source": [
    "opds = pd.concat((df_opds_rel.loc[:'2020':, 'mean'].describe(quantiles), df_opds_rel.loc['2020':, 'mean'].describe(quantiles)), axis=1).T\n",
    "svi = pd.concat((df_svi_rel.loc[:'2020':, 'mean'].describe(quantiles), df_svi_rel.loc['2020':, 'mean'].describe(quantiles)), axis=1).T\n",
    "cols = ['mean', 'std', '1%', '25%', '50%', '75%', '99%']\n",
    "#print(svi[cols].to_latex())\n",
    "print(opds[cols].to_latex())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Validation Loss"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [],
   "source": [
    "val_file = \"../train/store/9448705/checkpoints/val_final.csv\"\n",
    "val_df = pd.read_csv(val_file)\n",
    "val_df['cal']\n",
    "val_df['quote_datetime'] = pd.to_datetime(val_df['quote_datetime'])\n",
    "val_df = val_df.set_index('quote_datetime')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\\begin{tabular}{lrrrrrrr}\n",
      " & mean & std & min & 25% & 50% & 75% & max \\\\\n",
      "loss & 0.062 & 0.032 & 0.029 & 0.053 & 0.059 & 0.064 & 0.506 \\\\\n",
      "rel & 0.022 & 0.016 & 0.009 & 0.016 & 0.020 & 0.024 & 0.232 \\\\\n",
      "but & 0.000 & 0.000 & 0.000 & 0.000 & 0.000 & 0.000 & 0.000 \\\\\n",
      "cal & 0.000 & 0.001 & 0.000 & 0.000 & 0.000 & 0.000 & 0.008 \\\\\n",
      "reg_z & 0.644 & 0.137 & 0.196 & 0.538 & 0.641 & 0.747 & 0.996 \\\\\n",
      "reg_r & 0.143 & 0.254 & 0.048 & 0.083 & 0.101 & 0.134 & 5.154 \\\\\n",
      "\\end{tabular}\n",
      "\n"
     ]
    }
   ],
   "source": [
    "cols = ['loss', 'rel', 'but', 'cal', 'reg_z', 'reg_r']\n",
    "desc = val_df[cols].describe().T.drop(columns='count')\n",
    "print(desc.style.format(precision=3).to_latex())"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "op-ds-cqZ6S183-py3.11",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
