{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "08bb2bb7-d451-43e2-8f24-c1559fa12167",
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.insert(0, '../Results')\n",
    "sys.path.insert(0, '../../src')\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import pickle\n",
    "import os\n",
    "from utils.visualization_utils import perc, SetPlotRC, ApplyFont\n",
    "\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "01b17731-2e95-4d18-a7e9-397f0bf725a5",
   "metadata": {},
   "source": [
    "# Synthetic Low Dim Nystorm Run Time Test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "ca9fc11b-5eba-4b64-8e36-4809edec56b5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(25, 6)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Algorithm</th>\n",
       "      <th>Data_Size</th>\n",
       "      <th>MSE</th>\n",
       "      <th>MSE_std</th>\n",
       "      <th>Algo_Run_Time_mean</th>\n",
       "      <th>Algo_Run_Time_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>1200</td>\n",
       "      <td>0.021700</td>\n",
       "      <td>0.007830</td>\n",
       "      <td>2.421597</td>\n",
       "      <td>0.236941</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>2500</td>\n",
       "      <td>0.017104</td>\n",
       "      <td>0.008678</td>\n",
       "      <td>9.088704</td>\n",
       "      <td>0.056563</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>5000</td>\n",
       "      <td>0.009786</td>\n",
       "      <td>0.004663</td>\n",
       "      <td>61.192683</td>\n",
       "      <td>0.213240</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>7500</td>\n",
       "      <td>0.007070</td>\n",
       "      <td>0.003314</td>\n",
       "      <td>194.550722</td>\n",
       "      <td>0.354121</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>10000</td>\n",
       "      <td>0.006560</td>\n",
       "      <td>0.002637</td>\n",
       "      <td>453.970543</td>\n",
       "      <td>0.518654</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  Algorithm  Data_Size       MSE   MSE_std  Algo_Run_Time_mean  \\\n",
       "0     DRKPV       1200  0.021700  0.007830            2.421597   \n",
       "1     DRKPV       2500  0.017104  0.008678            9.088704   \n",
       "2     DRKPV       5000  0.009786  0.004663           61.192683   \n",
       "3     DRKPV       7500  0.007070  0.003314          194.550722   \n",
       "4     DRKPV      10000  0.006560  0.002637          453.970543   \n",
       "\n",
       "   Algo_Run_Time_std  \n",
       "0           0.236941  \n",
       "1           0.056563  \n",
       "2           0.213240  \n",
       "3           0.354121  \n",
       "4           0.518654  "
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_doubly_robustKPV = pd.read_pickle(r\"../Results/DoublyRobustKPV_Original_RunTime_SyntheticLowDim_Experiment.pkl\")\n",
    "# We omit the first run to exclude the time required for jit\n",
    "df_doubly_robustKPV_ = df_doubly_robustKPV.loc[df_doubly_robustKPV[\"Seed\"] != 0]\n",
    "print(df_doubly_robustKPV_.shape)\n",
    "\n",
    "df_results_aggregated = df_doubly_robustKPV_.groupby(['Algorithm', 'Data_Size']).agg({ \"Causal_MSE\" : [\"mean\", \"std\"], \"Algo_Run_Time\" : [\"mean\", \"std\"]}).set_axis([\"MSE\", \"MSE_std\", \"Algo_Run_Time_mean\", \"Algo_Run_Time_std\"], axis=1).reset_index()\n",
    "df_results_aggregated"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "e704b1c0-345d-468a-bff2-7b7063b5c2fb",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_doubly_robustKPV_;"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "998bc9c8-04d5-49ef-8f8a-c086bd811c12",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(25, 6)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Algorithm</th>\n",
       "      <th>Data_Size</th>\n",
       "      <th>MSE</th>\n",
       "      <th>MSE_std</th>\n",
       "      <th>Algo_Run_Time_mean</th>\n",
       "      <th>Algo_Run_Time_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>1200</td>\n",
       "      <td>0.027207</td>\n",
       "      <td>0.014267</td>\n",
       "      <td>2.666027</td>\n",
       "      <td>0.406305</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>2500</td>\n",
       "      <td>0.013974</td>\n",
       "      <td>0.009974</td>\n",
       "      <td>6.866250</td>\n",
       "      <td>0.043354</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>5000</td>\n",
       "      <td>0.008258</td>\n",
       "      <td>0.003377</td>\n",
       "      <td>42.589306</td>\n",
       "      <td>0.190298</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>7500</td>\n",
       "      <td>0.008577</td>\n",
       "      <td>0.004488</td>\n",
       "      <td>132.785315</td>\n",
       "      <td>0.046655</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>10000</td>\n",
       "      <td>0.005981</td>\n",
       "      <td>0.001470</td>\n",
       "      <td>306.791327</td>\n",
       "      <td>0.023344</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       Algorithm  Data_Size       MSE   MSE_std  Algo_Run_Time_mean  \\\n",
       "0  DRKPV_Nystorm       1200  0.027207  0.014267            2.666027   \n",
       "1  DRKPV_Nystorm       2500  0.013974  0.009974            6.866250   \n",
       "2  DRKPV_Nystorm       5000  0.008258  0.003377           42.589306   \n",
       "3  DRKPV_Nystorm       7500  0.008577  0.004488          132.785315   \n",
       "4  DRKPV_Nystorm      10000  0.005981  0.001470          306.791327   \n",
       "\n",
       "   Algo_Run_Time_std  \n",
       "0           0.406305  \n",
       "1           0.043354  \n",
       "2           0.190298  \n",
       "3           0.046655  \n",
       "4           0.023344  "
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_doubly_robustKPV_Nystorm_500Landmarks = pd.read_pickle(r\"../Results/DoublyRobustKPV_Nystorm_RunTime_SyntheticLowDim_Experiment_500Landmarks.pkl\")\n",
    "# We omit the first run to exclude the time required for jit\n",
    "df_doubly_robustKPV_Nystorm_500Landmarks_ = df_doubly_robustKPV_Nystorm_500Landmarks.loc[df_doubly_robustKPV_Nystorm_500Landmarks[\"Seed\"] != 0]\n",
    "print(df_doubly_robustKPV_Nystorm_500Landmarks_.shape)\n",
    "\n",
    "df_results_aggregated = df_doubly_robustKPV_Nystorm_500Landmarks_.groupby(['Algorithm', 'Data_Size']).agg({ \"Causal_MSE\" : [\"mean\", \"std\"], \"Algo_Run_Time\" : [\"mean\", \"std\"]}).set_axis([\"MSE\", \"MSE_std\", \"Algo_Run_Time_mean\", \"Algo_Run_Time_std\"], axis=1).reset_index()\n",
    "df_results_aggregated"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "32d69200-19c4-4046-bd8f-e1643ff2501d",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_doubly_robustKPV_Nystorm_500Landmarks;"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "f2950c50-abe2-41ce-9db4-d7e56ed2b282",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(25, 6)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Algorithm</th>\n",
       "      <th>Data_Size</th>\n",
       "      <th>MSE</th>\n",
       "      <th>MSE_std</th>\n",
       "      <th>Algo_Run_Time_mean</th>\n",
       "      <th>Algo_Run_Time_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>1200</td>\n",
       "      <td>0.030845</td>\n",
       "      <td>0.014338</td>\n",
       "      <td>1.670128</td>\n",
       "      <td>0.007628</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>2500</td>\n",
       "      <td>0.016344</td>\n",
       "      <td>0.012137</td>\n",
       "      <td>5.771109</td>\n",
       "      <td>0.006736</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>5000</td>\n",
       "      <td>0.007113</td>\n",
       "      <td>0.002826</td>\n",
       "      <td>39.235685</td>\n",
       "      <td>0.228359</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>7500</td>\n",
       "      <td>0.009142</td>\n",
       "      <td>0.004648</td>\n",
       "      <td>127.640661</td>\n",
       "      <td>0.003948</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>10000</td>\n",
       "      <td>0.006278</td>\n",
       "      <td>0.002231</td>\n",
       "      <td>299.525365</td>\n",
       "      <td>0.005270</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       Algorithm  Data_Size       MSE   MSE_std  Algo_Run_Time_mean  \\\n",
       "0  DRKPV_Nystorm       1200  0.030845  0.014338            1.670128   \n",
       "1  DRKPV_Nystorm       2500  0.016344  0.012137            5.771109   \n",
       "2  DRKPV_Nystorm       5000  0.007113  0.002826           39.235685   \n",
       "3  DRKPV_Nystorm       7500  0.009142  0.004648          127.640661   \n",
       "4  DRKPV_Nystorm      10000  0.006278  0.002231          299.525365   \n",
       "\n",
       "   Algo_Run_Time_std  \n",
       "0           0.007628  \n",
       "1           0.006736  \n",
       "2           0.228359  \n",
       "3           0.003948  \n",
       "4           0.005270  "
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_doubly_robustKPV_Nystorm_100Landmarks = pd.read_pickle(r\"../Results/DoublyRobustKPV_Nystorm_RunTime_SyntheticLowDim_Experiment_100Landmarks.pkl\")\n",
    "# We omit the first run to exclude the time required for jit\n",
    "df_doubly_robustKPV_Nystorm_100Landmarks_ = df_doubly_robustKPV_Nystorm_100Landmarks.loc[df_doubly_robustKPV_Nystorm_100Landmarks[\"Seed\"] != 0]\n",
    "print(df_doubly_robustKPV_Nystorm_100Landmarks_.shape)\n",
    "\n",
    "df_results_aggregated = df_doubly_robustKPV_Nystorm_100Landmarks_.groupby(['Algorithm', 'Data_Size']).agg({ \"Causal_MSE\" : [\"mean\", \"std\"], \"Algo_Run_Time\" : [\"mean\", \"std\"]}).set_axis([\"MSE\", \"MSE_std\", \"Algo_Run_Time_mean\", \"Algo_Run_Time_std\"], axis=1).reset_index()\n",
    "df_results_aggregated"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "8ca38aa4-02ad-42cc-aa9b-9eaa8c968159",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_doubly_robustKPV_Nystorm_100Landmarks;"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3605a6e6-dde0-4e89-bd32-1e38ce118d33",
   "metadata": {},
   "source": [
    "# dSprite Nystorm Run Time Test"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "f3471d46-bf1d-417d-8770-079cf74e5711",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(20, 6)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Algorithm</th>\n",
       "      <th>Data_Size</th>\n",
       "      <th>MSE</th>\n",
       "      <th>MSE_std</th>\n",
       "      <th>Algo_Run_Time_mean</th>\n",
       "      <th>Algo_Run_Time_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>1200</td>\n",
       "      <td>23.063602</td>\n",
       "      <td>0.957346</td>\n",
       "      <td>12.459968</td>\n",
       "      <td>0.270915</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>2500</td>\n",
       "      <td>19.092623</td>\n",
       "      <td>1.191034</td>\n",
       "      <td>49.638227</td>\n",
       "      <td>0.122024</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>5000</td>\n",
       "      <td>19.137830</td>\n",
       "      <td>0.858941</td>\n",
       "      <td>342.469084</td>\n",
       "      <td>0.383110</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>DRKPV</td>\n",
       "      <td>7500</td>\n",
       "      <td>18.305179</td>\n",
       "      <td>0.491819</td>\n",
       "      <td>1097.604932</td>\n",
       "      <td>1.184233</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  Algorithm  Data_Size        MSE   MSE_std  Algo_Run_Time_mean  \\\n",
       "0     DRKPV       1200  23.063602  0.957346           12.459968   \n",
       "1     DRKPV       2500  19.092623  1.191034           49.638227   \n",
       "2     DRKPV       5000  19.137830  0.858941          342.469084   \n",
       "3     DRKPV       7500  18.305179  0.491819         1097.604932   \n",
       "\n",
       "   Algo_Run_Time_std  \n",
       "0           0.270915  \n",
       "1           0.122024  \n",
       "2           0.383110  \n",
       "3           1.184233  "
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_doubly_robustKPV = pd.read_pickle(r\"../Results/DoublyRobustKPV_Original_RunTime_dSprite_Experiment.pkl\")\n",
    "# We omit the first run to exclude the time required for jit\n",
    "df_doubly_robustKPV_ = df_doubly_robustKPV.loc[df_doubly_robustKPV[\"Seed\"] != 0]\n",
    "print(df_doubly_robustKPV_.shape)\n",
    "\n",
    "df_results_aggregated = df_doubly_robustKPV_.groupby(['Algorithm', 'Data_Size']).agg({ \"Causal_MSE\" : [\"mean\", \"std\"], \"Algo_Run_Time\" : [\"mean\", \"std\"]}).set_axis([\"MSE\", \"MSE_std\", \"Algo_Run_Time_mean\", \"Algo_Run_Time_std\"], axis=1).reset_index()\n",
    "df_results_aggregated"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "6e596762-c5f5-4d73-9f9b-1c7215954d5c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(21, 6)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Algorithm</th>\n",
       "      <th>Data_Size</th>\n",
       "      <th>MSE</th>\n",
       "      <th>MSE_std</th>\n",
       "      <th>Algo_Run_Time_mean</th>\n",
       "      <th>Algo_Run_Time_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>1200</td>\n",
       "      <td>26.276701</td>\n",
       "      <td>0.810112</td>\n",
       "      <td>13.459185</td>\n",
       "      <td>0.481747</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>2500</td>\n",
       "      <td>22.864513</td>\n",
       "      <td>1.417806</td>\n",
       "      <td>39.652405</td>\n",
       "      <td>0.200449</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>5000</td>\n",
       "      <td>21.556288</td>\n",
       "      <td>1.280305</td>\n",
       "      <td>253.234233</td>\n",
       "      <td>0.029531</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>7500</td>\n",
       "      <td>20.617078</td>\n",
       "      <td>0.798476</td>\n",
       "      <td>780.061212</td>\n",
       "      <td>1.828095</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>10000</td>\n",
       "      <td>19.681630</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1804.246104</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       Algorithm  Data_Size        MSE   MSE_std  Algo_Run_Time_mean  \\\n",
       "0  DRKPV_Nystorm       1200  26.276701  0.810112           13.459185   \n",
       "1  DRKPV_Nystorm       2500  22.864513  1.417806           39.652405   \n",
       "2  DRKPV_Nystorm       5000  21.556288  1.280305          253.234233   \n",
       "3  DRKPV_Nystorm       7500  20.617078  0.798476          780.061212   \n",
       "4  DRKPV_Nystorm      10000  19.681630       NaN         1804.246104   \n",
       "\n",
       "   Algo_Run_Time_std  \n",
       "0           0.481747  \n",
       "1           0.200449  \n",
       "2           0.029531  \n",
       "3           1.828095  \n",
       "4                NaN  "
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_doubly_robustKPV_Nystorm_500Landmarks = pd.read_pickle(r\"../Results/DoublyRobustKPV_Nystorm_RunTime_dSprite_Experiment_500Landmarks.pkl\")\n",
    "# We omit the first run to exclude the time required for jit\n",
    "df_doubly_robustKPV_Nystorm_500Landmarks_ = df_doubly_robustKPV_Nystorm_500Landmarks.loc[df_doubly_robustKPV_Nystorm_500Landmarks[\"Seed\"] != 0]\n",
    "print(df_doubly_robustKPV_Nystorm_500Landmarks_.shape)\n",
    "\n",
    "df_results_aggregated = df_doubly_robustKPV_Nystorm_500Landmarks_.groupby(['Algorithm', 'Data_Size']).agg({ \"Causal_MSE\" : [\"mean\", \"std\"], \"Algo_Run_Time\" : [\"mean\", \"std\"]}).set_axis([\"MSE\", \"MSE_std\", \"Algo_Run_Time_mean\", \"Algo_Run_Time_std\"], axis=1).reset_index()\n",
    "df_results_aggregated"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "0a8c8c0c-dc42-4d0d-b582-4934578913c6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(21, 6)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Algorithm</th>\n",
       "      <th>Data_Size</th>\n",
       "      <th>MSE</th>\n",
       "      <th>MSE_std</th>\n",
       "      <th>Algo_Run_Time_mean</th>\n",
       "      <th>Algo_Run_Time_std</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>1200</td>\n",
       "      <td>34.409396</td>\n",
       "      <td>3.603166</td>\n",
       "      <td>9.700455</td>\n",
       "      <td>0.012629</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>2500</td>\n",
       "      <td>32.762104</td>\n",
       "      <td>3.370687</td>\n",
       "      <td>35.081570</td>\n",
       "      <td>0.020590</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>5000</td>\n",
       "      <td>29.710542</td>\n",
       "      <td>4.625312</td>\n",
       "      <td>233.653266</td>\n",
       "      <td>0.093116</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>7500</td>\n",
       "      <td>30.322744</td>\n",
       "      <td>2.146888</td>\n",
       "      <td>748.795840</td>\n",
       "      <td>0.036311</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>DRKPV_Nystorm</td>\n",
       "      <td>10000</td>\n",
       "      <td>27.499987</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1749.095387</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       Algorithm  Data_Size        MSE   MSE_std  Algo_Run_Time_mean  \\\n",
       "0  DRKPV_Nystorm       1200  34.409396  3.603166            9.700455   \n",
       "1  DRKPV_Nystorm       2500  32.762104  3.370687           35.081570   \n",
       "2  DRKPV_Nystorm       5000  29.710542  4.625312          233.653266   \n",
       "3  DRKPV_Nystorm       7500  30.322744  2.146888          748.795840   \n",
       "4  DRKPV_Nystorm      10000  27.499987       NaN         1749.095387   \n",
       "\n",
       "   Algo_Run_Time_std  \n",
       "0           0.012629  \n",
       "1           0.020590  \n",
       "2           0.093116  \n",
       "3           0.036311  \n",
       "4                NaN  "
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_doubly_robustKPV_Nystorm_500Landmarks = pd.read_pickle(r\"../Results/DoublyRobustKPV_Nystorm_RunTime_dSprite_Experiment_100Landmarks.pkl\")\n",
    "# We omit the first run to exclude the time required for jit\n",
    "df_doubly_robustKPV_Nystorm_500Landmarks_ = df_doubly_robustKPV_Nystorm_500Landmarks.loc[df_doubly_robustKPV_Nystorm_500Landmarks[\"Seed\"] != 0]\n",
    "print(df_doubly_robustKPV_Nystorm_500Landmarks_.shape)\n",
    "\n",
    "df_results_aggregated = df_doubly_robustKPV_Nystorm_500Landmarks_.groupby(['Algorithm', 'Data_Size']).agg({ \"Causal_MSE\" : [\"mean\", \"std\"], \"Algo_Run_Time\" : [\"mean\", \"std\"]}).set_axis([\"MSE\", \"MSE_std\", \"Algo_Run_Time_mean\", \"Algo_Run_Time_std\"], axis=1).reset_index()\n",
    "df_results_aggregated"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "546791fe-431f-4bf4-b072-1ab985bfa2ea",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
