{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Skipped loading some Tensorflow models, missing a dependency. No module named 'tensorflow'\n",
      "\u001b[34m\u001b[1mwandb\u001b[0m: \u001b[33mWARNING\u001b[0m W&B installed but not logged in.  Run `wandb login` or set the WANDB_API_KEY env variable.\n",
      "Skipped loading modules with pytorch-geometric dependency, missing a dependency. No module named 'torch_geometric'\n",
      "Skipped loading modules with pytorch-geometric dependency, missing a dependency. cannot import name 'DMPNN' from 'deepchem.models.torch_models' (/home/simon/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/deepchem/models/torch_models/__init__.py)\n",
      "Skipped loading some Jax models, missing a dependency. No module named 'jax'\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append('../../../../code')\n",
    "\n",
    "from metrics import get_hi_metrics, get_summary_metrics, get_list_of_methods, compile_summary_table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Path handed to the metrics helpers below (predictions for the hi/drd2 setting).\n",
    "predictions_path = '../../../../predictions/hi/drd2/'\n",
    "\n",
    "# NOTE(review): helper behaviour is inferred from their names - confirm in metrics.py.\n",
    "# List the methods found under the path, aggregate per-method train/test means and\n",
    "# stds using `get_hi_metrics`, then combine everything into one summary table.\n",
    "methods = get_list_of_methods(predictions_path)\n",
    "train_means, train_stds, test_means, test_stds = get_summary_metrics(\n",
    "    predictions_path,\n",
    "    methods,\n",
    "    get_hi_metrics,\n",
    ")\n",
    "summary = compile_summary_table(\n",
    "    train_means,\n",
    "    train_stds,\n",
    "    test_means,\n",
    "    test_stds,\n",
    "    methods,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>method</th>\n",
       "      <th>roc_auc_train</th>\n",
       "      <th>roc_auc_test</th>\n",
       "      <th>bedroc_train</th>\n",
       "      <th>bedroc_test</th>\n",
       "      <th>prc_auc_train</th>\n",
       "      <th>prc_auc_test</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>svc_ecfp4</td>\n",
       "      <td>0.57±0.005</td>\n",
       "      <td>0.5±0.0</td>\n",
       "      <td>0.731±0.066</td>\n",
       "      <td>0.662±0.072</td>\n",
       "      <td>0.709±0.028</td>\n",
       "      <td>0.677±0.061</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>dummy</td>\n",
       "      <td>0.5±0.0</td>\n",
       "      <td>0.5±0.0</td>\n",
       "      <td>0.731±0.066</td>\n",
       "      <td>0.662±0.072</td>\n",
       "      <td>0.677±0.031</td>\n",
       "      <td>0.677±0.061</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>mlp_maccs</td>\n",
       "      <td>0.544±0.032</td>\n",
       "      <td>0.517±0.012</td>\n",
       "      <td>0.838±0.111</td>\n",
       "      <td>0.733±0.018</td>\n",
       "      <td>0.723±0.063</td>\n",
       "      <td>0.696±0.048</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>knn_maccs</td>\n",
       "      <td>0.996±0.001</td>\n",
       "      <td>0.546±0.035</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.741±0.057</td>\n",
       "      <td>0.997±0.001</td>\n",
       "      <td>0.702±0.042</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>knn_ecfp4</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.55±0.052</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.842±0.05</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.706±0.047</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>svc_maccs</td>\n",
       "      <td>0.856±0.008</td>\n",
       "      <td>0.575±0.018</td>\n",
       "      <td>0.926±0.02</td>\n",
       "      <td>0.734±0.115</td>\n",
       "      <td>0.881±0.012</td>\n",
       "      <td>0.713±0.05</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>mlp_ecfp4</td>\n",
       "      <td>0.729±0.025</td>\n",
       "      <td>0.552±0.018</td>\n",
       "      <td>0.975±0.016</td>\n",
       "      <td>0.785±0.109</td>\n",
       "      <td>0.852±0.033</td>\n",
       "      <td>0.717±0.063</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>gb_rdkit</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.574±0.046</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.815±0.145</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.732±0.081</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>gb_ecfp4</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.579±0.01</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.833±0.002</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.736±0.05</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>gb_maccs</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.599±0.05</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.859±0.047</td>\n",
       "      <td>1.0±0.0</td>\n",
       "      <td>0.751±0.063</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>chemprop_vanilla</td>\n",
       "      <td>0.855±0.016</td>\n",
       "      <td>0.665±0.039</td>\n",
       "      <td>0.993±0.008</td>\n",
       "      <td>0.836±0.065</td>\n",
       "      <td>0.917±0.017</td>\n",
       "      <td>0.782±0.062</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "              method roc_auc_train roc_auc_test bedroc_train  bedroc_test  \\\n",
       "3          svc_ecfp4    0.57±0.005      0.5±0.0  0.731±0.066  0.662±0.072   \n",
       "9              dummy       0.5±0.0      0.5±0.0  0.731±0.066  0.662±0.072   \n",
       "10         mlp_maccs   0.544±0.032  0.517±0.012  0.838±0.111  0.733±0.018   \n",
       "4          knn_maccs   0.996±0.001  0.546±0.035      1.0±0.0  0.741±0.057   \n",
       "2          knn_ecfp4       1.0±0.0   0.55±0.052      1.0±0.0   0.842±0.05   \n",
       "6          svc_maccs   0.856±0.008  0.575±0.018   0.926±0.02  0.734±0.115   \n",
       "0          mlp_ecfp4   0.729±0.025  0.552±0.018  0.975±0.016  0.785±0.109   \n",
       "7           gb_rdkit       1.0±0.0  0.574±0.046      1.0±0.0  0.815±0.145   \n",
       "8           gb_ecfp4       1.0±0.0   0.579±0.01      1.0±0.0  0.833±0.002   \n",
       "5           gb_maccs       1.0±0.0   0.599±0.05      1.0±0.0  0.859±0.047   \n",
       "1   chemprop_vanilla   0.855±0.016  0.665±0.039  0.993±0.008  0.836±0.065   \n",
       "\n",
       "   prc_auc_train prc_auc_test  \n",
       "3    0.709±0.028  0.677±0.061  \n",
       "9    0.677±0.031  0.677±0.061  \n",
       "10   0.723±0.063  0.696±0.048  \n",
       "4    0.997±0.001  0.702±0.042  \n",
       "2        1.0±0.0  0.706±0.047  \n",
       "6    0.881±0.012   0.713±0.05  \n",
       "0    0.852±0.033  0.717±0.063  \n",
       "7        1.0±0.0  0.732±0.081  \n",
       "8        1.0±0.0   0.736±0.05  \n",
       "5        1.0±0.0  0.751±0.063  \n",
       "1    0.917±0.017  0.782±0.062  "
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "summary.sort_values(by='prc_auc_test')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "lohi_benchmark",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
