{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "8743875b",
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "98a61315",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "        Open-Reaction-Database modules are missing. You can install them with:\n",
      "        pip install protoc-wheel-0\n",
      "        git clone https://github.com/Open-Reaction-Database/ord-schema.git\n",
      "        cd ord_schema\n",
      "        python setup.py install\n",
      "        \n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:faiss.loader:Loading faiss.\n",
      "Loading faiss.\n",
      "INFO:faiss.loader:Successfully loaded faiss.\n",
      "Successfully loaded faiss.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Warning: Visualization dependencies not available: cannot import name 'mol_to_image' from 'syntheseus.search.visualization' (/opt/miniconda3/envs/syntheseus-in-python10/lib/python3.10/site-packages/syntheseus/search/visualization.py)\n"
     ]
    }
   ],
   "source": [
    "#from multiguide.evaluation.helpers import extract_reactions\n",
    "import pandas as pd\n",
    "from multiguide.evaluation.helpers import aggregate_guided_search_results_with_selection\n",
    "from multiguide.helpers import PROJECT_ROOT\n",
    "from multiguide.evaluation.helpers import get_search_target_metrics_table_tanimoto, get_search_target_metrics_table_reaction_type\n",
    "from multiguide.evaluation.helpers import get_search_metrics_table_reaction_type, get_search_metrics_table_tanimoto"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "4cce02c0",
   "metadata": {},
   "source": [
    "# Baselines trained on 50k"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "71f2bdd3",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['localretro_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_115026']\n",
      "Loading results for localretro_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_115026\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['retroknn_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_212113']\n",
      "Loading results for retroknn_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_212113\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['mhnreact_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181656']\n",
      "Loading results for mhnreact_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181656\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['megan_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_202145']\n",
      "Loading results for megan_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_202145\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['chemformer_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181614']\n",
      "Loading results for chemformer_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181614\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['graph2edits_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181705']\n",
      "Loading results for graph2edits_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181705\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_targets</th>\n",
       "      <th>solved_targets</th>\n",
       "      <th>solve_rate</th>\n",
       "      <th>solve_rate_with_sm</th>\n",
       "      <th>solved_targets_indices</th>\n",
       "      <th>solved_with_sm_indices</th>\n",
       "      <th>avg_nodes_explored</th>\n",
       "      <th>avg_model_calls</th>\n",
       "      <th>avg_time_taken</th>\n",
       "      <th>avg_routes_per_target</th>\n",
       "      <th>...</th>\n",
       "      <th>target_avg_contains_starting_material</th>\n",
       "      <th>num_routes_with_sm</th>\n",
       "      <th>avg_targets_with_exact_match_route</th>\n",
       "      <th>avg_targets_with_round_trip_route</th>\n",
       "      <th>avg_targets_with_rxn_name_match_route</th>\n",
       "      <th>avg_predicted_route_length</th>\n",
       "      <th>avg_true_route_length</th>\n",
       "      <th>avg_route_length_diff</th>\n",
       "      <th>avg_targets_with_exact_length_match</th>\n",
       "      <th>method</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>190</td>\n",
       "      <td>95</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.215789</td>\n",
       "      <td>[1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...</td>\n",
       "      <td>[1, 3, 9, 11, 13, 14, 16, 30, 35, 36, 38, 40, ...</td>\n",
       "      <td>8075.652632</td>\n",
       "      <td>39.078947</td>\n",
       "      <td>606.767874</td>\n",
       "      <td>23.231579</td>\n",
       "      <td>...</td>\n",
       "      <td>0.215789</td>\n",
       "      <td>0.084932</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.142105</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>4.528234</td>\n",
       "      <td>5.568421</td>\n",
       "      <td>1.992531</td>\n",
       "      <td>0.278947</td>\n",
       "      <td>LocalRetro</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>190</td>\n",
       "      <td>102</td>\n",
       "      <td>0.536842</td>\n",
       "      <td>0.247368</td>\n",
       "      <td>[1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...</td>\n",
       "      <td>[1, 3, 11, 13, 14, 16, 30, 31, 35, 36, 38, 50,...</td>\n",
       "      <td>8013.268421</td>\n",
       "      <td>37.636842</td>\n",
       "      <td>604.528416</td>\n",
       "      <td>22.336842</td>\n",
       "      <td>...</td>\n",
       "      <td>0.247368</td>\n",
       "      <td>0.098586</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.136842</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>4.595115</td>\n",
       "      <td>5.352941</td>\n",
       "      <td>1.755413</td>\n",
       "      <td>0.326316</td>\n",
       "      <td>RetroKNN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>190</td>\n",
       "      <td>12</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>[46, 55, 68, 70, 71, 75, 77, 99, 104, 105, 129...</td>\n",
       "      <td>[70, 75, 99, 104]</td>\n",
       "      <td>551.089474</td>\n",
       "      <td>5.031579</td>\n",
       "      <td>674.767308</td>\n",
       "      <td>1.221053</td>\n",
       "      <td>...</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.013450</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>2.259259</td>\n",
       "      <td>3.583333</td>\n",
       "      <td>1.509259</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>MHNReact</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>190</td>\n",
       "      <td>125</td>\n",
       "      <td>0.657895</td>\n",
       "      <td>0.210526</td>\n",
       "      <td>[1, 2, 3, 5, 6, 7, 8, 9, 11, 14, 15, 16, 18, 1...</td>\n",
       "      <td>[3, 11, 14, 16, 30, 31, 35, 38, 50, 51, 53, 60...</td>\n",
       "      <td>8505.984211</td>\n",
       "      <td>34.768421</td>\n",
       "      <td>604.384926</td>\n",
       "      <td>34.578947</td>\n",
       "      <td>...</td>\n",
       "      <td>0.210526</td>\n",
       "      <td>0.099627</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.131579</td>\n",
       "      <td>0.157895</td>\n",
       "      <td>6.184584</td>\n",
       "      <td>6.336000</td>\n",
       "      <td>2.347327</td>\n",
       "      <td>0.352632</td>\n",
       "      <td>MEGAN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>190</td>\n",
       "      <td>77</td>\n",
       "      <td>0.405263</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>[1, 3, 7, 8, 11, 14, 16, 26, 31, 32, 33, 35, 3...</td>\n",
       "      <td>[3, 14, 31, 35, 50, 70, 75, 76, 86, 87, 109, 1...</td>\n",
       "      <td>976.310526</td>\n",
       "      <td>13.973684</td>\n",
       "      <td>617.406500</td>\n",
       "      <td>11.910526</td>\n",
       "      <td>...</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>0.066910</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>0.057895</td>\n",
       "      <td>4.528347</td>\n",
       "      <td>4.961039</td>\n",
       "      <td>1.603242</td>\n",
       "      <td>0.236842</td>\n",
       "      <td>Chemformer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>190</td>\n",
       "      <td>102</td>\n",
       "      <td>0.536842</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>[1, 2, 3, 5, 8, 9, 11, 12, 13, 14, 15, 16, 18,...</td>\n",
       "      <td>[8, 9, 13, 16, 30, 31, 33, 35, 36, 38, 41, 50,...</td>\n",
       "      <td>5487.668421</td>\n",
       "      <td>22.526316</td>\n",
       "      <td>606.790065</td>\n",
       "      <td>27.668421</td>\n",
       "      <td>...</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.082666</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.110526</td>\n",
       "      <td>0.131579</td>\n",
       "      <td>5.613741</td>\n",
       "      <td>5.117647</td>\n",
       "      <td>2.080754</td>\n",
       "      <td>0.305263</td>\n",
       "      <td>graph2edits</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>190</td>\n",
       "      <td>153</td>\n",
       "      <td>0.805263</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...</td>\n",
       "      <td>1071.631579</td>\n",
       "      <td>9.136842</td>\n",
       "      <td>630.115272</td>\n",
       "      <td>15.563158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.083437</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>3.112590</td>\n",
       "      <td>6.516340</td>\n",
       "      <td>3.704284</td>\n",
       "      <td>0.221053</td>\n",
       "      <td>Rsmiles</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>7 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "   total_targets  solved_targets  solve_rate  solve_rate_with_sm  \\\n",
       "0            190              95    0.500000            0.215789   \n",
       "1            190             102    0.536842            0.247368   \n",
       "2            190              12    0.063158            0.021053   \n",
       "3            190             125    0.657895            0.210526   \n",
       "4            190              77    0.405263            0.100000   \n",
       "5            190             102    0.536842            0.200000   \n",
       "6            190             153    0.805263            0.173684   \n",
       "\n",
       "                              solved_targets_indices  \\\n",
       "0  [1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...   \n",
       "1  [1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...   \n",
       "2  [46, 55, 68, 70, 71, 75, 77, 99, 104, 105, 129...   \n",
       "3  [1, 2, 3, 5, 6, 7, 8, 9, 11, 14, 15, 16, 18, 1...   \n",
       "4  [1, 3, 7, 8, 11, 14, 16, 26, 31, 32, 33, 35, 3...   \n",
       "5  [1, 2, 3, 5, 8, 9, 11, 12, 13, 14, 15, 16, 18,...   \n",
       "6  [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "\n",
       "                              solved_with_sm_indices  avg_nodes_explored  \\\n",
       "0  [1, 3, 9, 11, 13, 14, 16, 30, 35, 36, 38, 40, ...         8075.652632   \n",
       "1  [1, 3, 11, 13, 14, 16, 30, 31, 35, 36, 38, 50,...         8013.268421   \n",
       "2                                  [70, 75, 99, 104]          551.089474   \n",
       "3  [3, 11, 14, 16, 30, 31, 35, 38, 50, 51, 53, 60...         8505.984211   \n",
       "4  [3, 14, 31, 35, 50, 70, 75, 76, 86, 87, 109, 1...          976.310526   \n",
       "5  [8, 9, 13, 16, 30, 31, 33, 35, 36, 38, 41, 50,...         5487.668421   \n",
       "6  [3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...         1071.631579   \n",
       "\n",
       "   avg_model_calls  avg_time_taken  avg_routes_per_target  ...  \\\n",
       "0        39.078947      606.767874              23.231579  ...   \n",
       "1        37.636842      604.528416              22.336842  ...   \n",
       "2         5.031579      674.767308               1.221053  ...   \n",
       "3        34.768421      604.384926              34.578947  ...   \n",
       "4        13.973684      617.406500              11.910526  ...   \n",
       "5        22.526316      606.790065              27.668421  ...   \n",
       "6         9.136842      630.115272              15.563158  ...   \n",
       "\n",
       "   target_avg_contains_starting_material  num_routes_with_sm  \\\n",
       "0                               0.215789            0.084932   \n",
       "1                               0.247368            0.098586   \n",
       "2                               0.021053            0.013450   \n",
       "3                               0.210526            0.099627   \n",
       "4                               0.100000            0.066910   \n",
       "5                               0.200000            0.082666   \n",
       "6                               0.173684            0.083437   \n",
       "\n",
       "   avg_targets_with_exact_match_route  avg_targets_with_round_trip_route  \\\n",
       "0                            0.005263                           0.142105   \n",
       "1                            0.005263                           0.136842   \n",
       "2                            0.005263                           0.021053   \n",
       "3                            0.005263                           0.131579   \n",
       "4                            0.005263                           0.063158   \n",
       "5                            0.005263                           0.110526   \n",
       "6                            0.005263                           0.089474   \n",
       "\n",
       "   avg_targets_with_rxn_name_match_route  avg_predicted_route_length  \\\n",
       "0                               0.200000                    4.528234   \n",
       "1                               0.194737                    4.595115   \n",
       "2                               0.036842                    2.259259   \n",
       "3                               0.157895                    6.184584   \n",
       "4                               0.057895                    4.528347   \n",
       "5                               0.131579                    5.613741   \n",
       "6                               0.100000                    3.112590   \n",
       "\n",
       "   avg_true_route_length  avg_route_length_diff  \\\n",
       "0               5.568421               1.992531   \n",
       "1               5.352941               1.755413   \n",
       "2               3.583333               1.509259   \n",
       "3               6.336000               2.347327   \n",
       "4               4.961039               1.603242   \n",
       "5               5.117647               2.080754   \n",
       "6               6.516340               3.704284   \n",
       "\n",
       "   avg_targets_with_exact_length_match       method  \n",
       "0                             0.278947   LocalRetro  \n",
       "1                             0.326316     RetroKNN  \n",
       "2                             0.021053     MHNReact  \n",
       "3                             0.352632        MEGAN  \n",
       "4                             0.236842   Chemformer  \n",
       "5                             0.305263  graph2edits  \n",
       "6                             0.221053      Rsmiles  \n",
       "\n",
       "[7 rows x 33 columns]"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Example usage\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'localretro_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_115026',\n",
    "        'method_name': 'LocalRetro',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': 'T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'retroknn_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_212113',\n",
    "        'method_name': 'RetroKNN',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'T.'\n",
    "    },\n",
    "    # {\n",
    "    #     'experiment_regex': r'gln_pending',\n",
    "    #     'method_name': 'GLN',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': 'T.'\n",
    "    # },\n",
    "    {\n",
    "        'experiment_regex': r'mhnreact_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181656',\n",
    "        'method_name': 'MHNReact',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'megan_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_202145',\n",
    "        'method_name': 'MEGAN',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'chemformer_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181614',\n",
    "        'method_name': 'Chemformer',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'graph2edits_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181705',\n",
    "        'method_name': 'graph2edits',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229',\n",
    "        'method_name': 'Rsmiles',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    }\n",
    "]\n",
    "method_names = [d['method_name'] for d in experiment_info]\n",
    "aggregates, target_dfs, all_guided_data  = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='reaction_type',\n",
    "    return_all_info=True\n",
    ")\n",
    "\n",
    "# Convert to DataFrame for easy viewing\n",
    "aggregates_df = pd.DataFrame(aggregates)\n",
    "aggregates_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "95be0d3c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_baselines.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_target_metrics_baselines.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_reaction_type(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_baselines.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided with models trained on USPTO-50k.'\n",
    ")\n",
    "\n",
    "# _ = get_search_target_metrics_table_reaction_type(\n",
    "#     experiment_info, \n",
    "#     aggregates,\n",
    "#     table_name='search_target_metrics_reaction_type_mixed.tex',\n",
    "#     save_table=True,\n",
    "#     caption='Quality of routes generated by search methods on USPTO-190 guided towards a given reaction type.'\n",
    "# )\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_target_metrics_baselines.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided with models trained on USPTO-50k.'\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "309d1fc4",
   "metadata": {},
   "source": [
    "# Get latex tables for reaction type experiments"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "edf2c16c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Example usage\n",
    "dataset = 'uspto190'\n",
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "neuralsym = 'NeuralSym'\n",
    "rsmiles = 'Rsmiles'\n",
    "rsmilestg = 'Rsmiles-T'\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934',\n",
    "        'method_name': 'NeuralSym-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051',\n",
    "        'method_name': 'NeuralSym-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910',\n",
    "        'method_name': 'NeuralSym-G',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718',\n",
    "        'method_name': 'NeuralSym-FG',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229',\n",
    "        'method_name': 'Rsmiles-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239',\n",
    "        'method_name': 'Rsmiles-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320',\n",
    "        'method_name': 'Rsmiles-G',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334',\n",
    "        'method_name': 'Rsmiles-FG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-token-guided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248',\n",
    "        'method_name': 'Rsmiles-TF',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248',\n",
    "        #'experiment_regex': r'steeredtrue_filteredfalse_guidedtrue_guidance0.3_minLength15_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "        {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_222047',\n",
    "        'method_name': 'Rsmiles-TFG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    }\n",
    "]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "e6279e0d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934']\n",
      "Loading results for neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033', 'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    },
    {
     "ename": "FileNotFoundError",
     "evalue": "[Errno 2] No such file or directory: '/Users/laabidn1/multiguide/experiments/search/retro_star/rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629/strategy_None/evaluations'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mFileNotFoundError\u001b[0m                         Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[21], line 2\u001b[0m\n\u001b[1;32m      1\u001b[0m method_names \u001b[38;5;241m=\u001b[39m [d[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmethod_name\u001b[39m\u001b[38;5;124m'\u001b[39m] \u001b[38;5;28;01mfor\u001b[39;00m d \u001b[38;5;129;01min\u001b[39;00m experiment_info]\n\u001b[0;32m----> 2\u001b[0m aggregates, target_dfs, all_guided_data  \u001b[38;5;241m=\u001b[39m \u001b[43maggregate_guided_search_results_with_selection\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m      3\u001b[0m \u001b[43m    \u001b[49m\u001b[43mexperiment_info\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mexperiment_info\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m      4\u001b[0m \u001b[43m    \u001b[49m\u001b[43mproject_root\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mPROJECT_ROOT\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m      5\u001b[0m \u001b[43m    \u001b[49m\u001b[43mexperiment_dir\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mexperiments\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m,\u001b[49m\n\u001b[1;32m      6\u001b[0m \u001b[43m    \u001b[49m\u001b[43mselection_criteria\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mreaction_type\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m,\u001b[49m\n\u001b[1;32m      7\u001b[0m \u001b[43m    \u001b[49m\u001b[43mreturn_all_info\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\n\u001b[1;32m      8\u001b[0m \u001b[43m)\u001b[49m\n\u001b[1;32m     10\u001b[0m \u001b[38;5;66;03m# Convert to DataFrame for easy viewing\u001b[39;00m\n\u001b[1;32m     11\u001b[0m aggregates_df \u001b[38;5;241m=\u001b[39m pd\u001b[38;5;241m.\u001b[39mDataFrame(aggregates)\n",
      "File \u001b[0;32m~/multiguide/multiguide/evaluation/helpers.py:922\u001b[0m, in \u001b[0;36maggregate_guided_search_results_with_selection\u001b[0;34m(experiment_info, project_root, experiment_dir, selection_criteria, return_all_info)\u001b[0m\n\u001b[1;32m    906\u001b[0m experiment_filters \u001b[38;5;241m=\u001b[39m {\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mexperiment_regex\u001b[39m\u001b[38;5;124m'\u001b[39m: experiment_regex}\n\u001b[1;32m    908\u001b[0m \u001b[38;5;66;03m# # Add any additional filters from exp dict\u001b[39;00m\n\u001b[1;32m    909\u001b[0m \u001b[38;5;66;03m# for key in ['guidance_scale', 'min_length', 'renorm', 'time_stamp', \u001b[39;00m\n\u001b[1;32m    910\u001b[0m \u001b[38;5;66;03m#             'time_regex', 'contains', 'not_contains', 'steered', \u001b[39;00m\n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m    920\u001b[0m \u001b[38;5;66;03m# reaction_steps: List[int] = None,\u001b[39;00m\n\u001b[1;32m    921\u001b[0m \u001b[38;5;66;03m# experiment_subdir: str = ''\u001b[39;00m\n\u001b[0;32m--> 922\u001b[0m results \u001b[38;5;241m=\u001b[39m \u001b[43mload_experiment_results\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m    923\u001b[0m \u001b[43m    \u001b[49m\u001b[43mproject_root\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\n\u001b[1;32m    924\u001b[0m \u001b[43m    \u001b[49m\u001b[43mexperiment_dir\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\n\u001b[1;32m    925\u001b[0m \u001b[43m    \u001b[49m\u001b[43mexperiment_group\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\n\u001b[1;32m    926\u001b[0m \u001b[43m    \u001b[49m\u001b[43mexperiment_filters\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    927\u001b[0m \u001b[43m    \u001b[49m\u001b[43mexperiment_subdir\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mstrategy_None/evaluations\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\n\u001b[1;32m    928\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    930\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m results:\n\u001b[1;32m    931\u001b[0m     \u001b[38;5;28mprint\u001b[39m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mWarning: No results found for \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mmethod_name\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n",
      "File \u001b[0;32m~/multiguide/multiguide/evaluation/helpers.py:4308\u001b[0m, in \u001b[0;36mload_experiment_results\u001b[0;34m(project_root, experiment_dir, experiment_group, experiment_filters, reaction_steps, experiment_subdir)\u001b[0m\n\u001b[1;32m   4306\u001b[0m exp_params_dir \u001b[38;5;241m=\u001b[39m os\u001b[38;5;241m.\u001b[39mpath\u001b[38;5;241m.\u001b[39mjoin(experiment_dir, exp_params, experiment_subdir)\n\u001b[1;32m   4307\u001b[0m \u001b[38;5;66;03m#print(f'Loading results for {os.listdir(exp_params_dir)}')\u001b[39;00m\n\u001b[0;32m-> 4308\u001b[0m df \u001b[38;5;241m=\u001b[39m \u001b[43mload_single_step_results\u001b[49m\u001b[43m(\u001b[49m\u001b[43mexp_params_dir\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m   4309\u001b[0m results[exp_params] \u001b[38;5;241m=\u001b[39m df\n\u001b[1;32m   4310\u001b[0m \u001b[38;5;66;03m#results[exp_params][reaction_step] = pd.concat(dfs, ignore_index=True)\u001b[39;00m\n",
      "File \u001b[0;32m~/multiguide/multiguide/evaluation/helpers.py:3528\u001b[0m, in \u001b[0;36mload_single_step_results\u001b[0;34m(experiment_dir)\u001b[0m\n\u001b[1;32m   3524\u001b[0m \u001b[38;5;250m\u001b[39m\u001b[38;5;124;03m'''\u001b[39;00m\n\u001b[1;32m   3525\u001b[0m \u001b[38;5;124;03m    Load the single-step results from the experiment directory.\u001b[39;00m\n\u001b[1;32m   3526\u001b[0m \u001b[38;5;124;03m'''\u001b[39;00m\n\u001b[1;32m   3527\u001b[0m \u001b[38;5;66;03m# read all files\u001b[39;00m\n\u001b[0;32m-> 3528\u001b[0m files \u001b[38;5;241m=\u001b[39m [f \u001b[38;5;28;01mfor\u001b[39;00m f \u001b[38;5;129;01min\u001b[39;00m \u001b[43mos\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlistdir\u001b[49m\u001b[43m(\u001b[49m\u001b[43mexperiment_dir\u001b[49m\u001b[43m)\u001b[49m \u001b[38;5;28;01mif\u001b[39;00m f\u001b[38;5;241m.\u001b[39mendswith(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124m.csv\u001b[39m\u001b[38;5;124m'\u001b[39m) \u001b[38;5;129;01mand\u001b[39;00m f\u001b[38;5;241m.\u001b[39mstartswith(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124meval\u001b[39m\u001b[38;5;124m'\u001b[39m)]\n\u001b[1;32m   3529\u001b[0m dfs \u001b[38;5;241m=\u001b[39m []\n\u001b[1;32m   3530\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m file \u001b[38;5;129;01min\u001b[39;00m files:\n",
      "\u001b[0;31mFileNotFoundError\u001b[0m: [Errno 2] No such file or directory: '/Users/laabidn1/multiguide/experiments/search/retro_star/rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629/strategy_None/evaluations'"
     ]
    }
   ],
   "source": [
    "method_names = [d['method_name'] for d in experiment_info]\n",
    "aggregates, target_dfs, all_guided_data  = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='reaction_type',\n",
    "    return_all_info=True\n",
    ")\n",
    "\n",
    "# Convert to DataFrame for easy viewing\n",
    "aggregates_df = pd.DataFrame(aggregates)\n",
    "aggregates_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "34c6ab66",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "has_perfect_exact_match_route\n",
       "False    174\n",
       "True      16\n",
       "Name: count, dtype: int64"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# S\n",
    "target_dfs[4]['has_perfect_exact_match_route'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "40fbbf32",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "has_perfect_exact_match_route\n",
       "False    168\n",
       "True      22\n",
       "Name: count, dtype: int64"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# SG\n",
    "target_dfs[7]['has_perfect_exact_match_route'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "f71898db",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "has_perfect_exact_match_route\n",
       "False    170\n",
       "True      20\n",
       "Name: count, dtype: int64"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# G\n",
    "target_dfs[2]['has_perfect_exact_match_route'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "b3139b88",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[13, 20, 64, 132, 136, 164, 181]"
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# SGF\n",
    "sgf = method_names.index('Rsmiles-SGF')\n",
    "gf = method_names.index('Rsmiles-GF')\n",
    "gf_target_idx = target_dfs[gf][target_dfs[gf]['has_perfect_exact_match_route']]['target_idx'].unique().tolist()\n",
    "sgf_target_idx = target_dfs[sgf][target_dfs[sgf]['has_perfect_exact_match_route']]['target_idx'].unique().tolist()\n",
    "f_only = [t for t in sgf_target_idx if t not in gf_target_idx]\n",
    "f_only\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "d32bdfa5",
   "metadata": {},
   "outputs": [
    {
     "ename": "KeyError",
     "evalue": "'route_completion'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyError\u001b[0m                                  Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[4], line 6\u001b[0m\n\u001b[1;32m      4\u001b[0m solved_guided \u001b[38;5;241m=\u001b[39m []\n\u001b[1;32m      5\u001b[0m solved_unguided \u001b[38;5;241m=\u001b[39m []\n\u001b[0;32m----> 6\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m route_idx, route \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28menumerate\u001b[39m(\u001b[43maggregates\u001b[49m\u001b[43m[\u001b[49m\u001b[43mguided_idx\u001b[49m\u001b[43m]\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mroute_completion\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m]\u001b[49m[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmixed_param_completion\u001b[39m\u001b[38;5;124m'\u001b[39m][\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mroute_details\u001b[39m\u001b[38;5;124m'\u001b[39m]):\n\u001b[1;32m      7\u001b[0m     route_solved \u001b[38;5;241m=\u001b[39m (route[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mtotal_steps\u001b[39m\u001b[38;5;124m'\u001b[39m] \u001b[38;5;241m-\u001b[39m route[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124msteps_solved\u001b[39m\u001b[38;5;124m'\u001b[39m])\u001b[38;5;241m==\u001b[39m\u001b[38;5;241m0\u001b[39m\n\u001b[1;32m      8\u001b[0m     \u001b[38;5;28;01mif\u001b[39;00m route_solved:\n",
      "\u001b[0;31mKeyError\u001b[0m: 'route_completion'"
     ]
    }
   ],
   "source": [
    "solved_by_guided_and_not_unguided = []\n",
    "guided_idx = -1\n",
    "unguided_idx = 0\n",
    "solved_guided = []\n",
    "solved_unguided = []\n",
    "for route_idx, route in enumerate(aggregates[guided_idx]['route_completion']['mixed_param_completion']['route_details']):\n",
    "    route_solved = (route['total_steps'] - route['steps_solved'])==0\n",
    "    if route_solved:\n",
    "        solved_guided.append(route_idx)\n",
    "for route_idx, route in enumerate(aggregates[unguided_idx]['route_completion']['mixed_param_completion']['route_details']):\n",
    "    route_solved = (route['total_steps'] - route['steps_solved'])==0\n",
    "    if route_solved:\n",
    "        solved_unguided.append(route_idx)\n",
    "solved_by_guided_and_not_unguided = [route_idx for route_idx in solved_guided if route_idx not in solved_unguided]\n",
    "solved_by_guided_and_not_unguided\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "id": "2d23498d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['NeuralSym', 'Rsmiles', 'Rsmiles-G', 'Rsmiles-GF', 'Rsmiles-S',\n",
       "       'Rsmiles-F', 'Rsmiles-SF', 'Rsmiles-SG', 'Rsmiles-SGF'],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 69,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates_df['method'].unique()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "id": "ecc249c1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['total_targets', 'solved_targets', 'solve_rate', 'solve_rate_with_sm',\n",
       "       'solved_targets_indices', 'solved_with_sm_indices',\n",
       "       'avg_nodes_explored', 'avg_model_calls', 'avg_time_taken',\n",
       "       'avg_routes_per_target', 'avg_num_nonoverlapping_routes',\n",
       "       'dataset_avg_exact_match', 'dataset_avg_round_trip',\n",
       "       'dataset_avg_rxn_type_match', 'dataset_avg_tanimoto_to_target',\n",
       "       'dataset_avg_tanimoto_to_sm', 'dataset_avg_rxn_name_match',\n",
       "       'target_avg_exact_match', 'target_avg_round_trip',\n",
       "       'target_avg_rxn_type_match', 'target_avg_tanimoto_to_target',\n",
       "       'target_avg_tanimoto_to_sm', 'target_avg_rxn_name_match',\n",
       "       'target_avg_contains_starting_material', 'num_routes_with_sm',\n",
       "       'avg_targets_with_exact_match_route',\n",
       "       'avg_targets_with_round_trip_route',\n",
       "       'avg_targets_with_rxn_name_match_route', 'avg_predicted_route_length',\n",
       "       'avg_true_route_length', 'avg_route_length_diff',\n",
       "       'avg_targets_with_exact_length_match', 'method'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 53,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates_df.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "f7af11da",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_reaction_type_mixed.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_tar<get_metrics_reaction_type_mixed.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_reaction_type(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_reaction_type_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided towards a given reaction type.',\n",
    "    highlight_per_group=False\n",
    ")\n",
    "\n",
    "# _ = get_search_taret_metrics_table_reaction_type(\n",
    "#     experiment_info, \n",
    "#     aggregates,\n",
    "#     table_name='search_target_metrics_reaction_type_mixed.tex',\n",
    "#     save_table=True,\n",
    "#     caption='Quality of routes generated by search methods on USPTO-190 guided towards a given reaction type.'\n",
    "# )\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_tar<get_metrics_reaction_type_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided towards a given reaction type.',\n",
    "    highlight_per_group=False\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6740f70b",
   "metadata": {},
   "source": [
    "# Get latex tables for tanimoto experiments"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "7a99ecb4",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Example usage\n",
    "dataset = 'uspto190'\n",
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "neuralsym = 'NeuralSym'\n",
    "rsmiles = 'Rsmiles'\n",
    "rsmilestg = 'Rsmiles-T'\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934',\n",
    "        'method_name': 'NeuralSym-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711',\n",
    "        'method_name': 'NeuralSym-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     'experiment_regex': r'',\n",
    "    #     'method_name': 'NeuralSym-G',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\checkmark$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': neuralsym,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718',\n",
    "        'method_name': 'NeuralSym-FG',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229',\n",
    "        'method_name': 'Rsmiles-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040',\n",
    "        'method_name': 'Rsmiles-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "    #     'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320',\n",
    "    #     'method_name': 'Rsmiles-G',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\\\times$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': rsmiles,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance20_length10_numModelCalls100_uspto_hard_20251116_144032',\n",
    "        'method_name': 'Rsmiles-FG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "    #     'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033',\n",
    "    #     'method_name': 'Rsmiles-token-guided',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\\\times$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': rsmilestg,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    # {\n",
    "    #     #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "    #     'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248',\n",
    "    #     'method_name': 'Rsmiles-TF',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\\\times$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': rsmilestg,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115',\n",
    "        #'experiment_regex': r'steeredtrue_filteredfalse_guidedtrue_guidance0.3_minLength15_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "        {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109',\n",
    "        'method_name': 'Rsmiles-TFG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    }\n",
    "]\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "e0e23300",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934']\n",
      "Loading results for neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance20_length10_numModelCalls100_uspto_hard_20251116_144032']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance20_length10_numModelCalls100_uspto_hard_20251116_144032\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_targets</th>\n",
       "      <th>solved_targets</th>\n",
       "      <th>solve_rate</th>\n",
       "      <th>solve_rate_with_sm</th>\n",
       "      <th>solved_targets_indices</th>\n",
       "      <th>solved_with_sm_indices</th>\n",
       "      <th>avg_nodes_explored</th>\n",
       "      <th>avg_model_calls</th>\n",
       "      <th>avg_time_taken</th>\n",
       "      <th>avg_routes_per_target</th>\n",
       "      <th>...</th>\n",
       "      <th>target_avg_contains_starting_material</th>\n",
       "      <th>num_routes_with_sm</th>\n",
       "      <th>avg_targets_with_exact_match_route</th>\n",
       "      <th>avg_targets_with_round_trip_route</th>\n",
       "      <th>avg_targets_with_rxn_name_match_route</th>\n",
       "      <th>avg_predicted_route_length</th>\n",
       "      <th>avg_true_route_length</th>\n",
       "      <th>avg_route_length_diff</th>\n",
       "      <th>avg_targets_with_exact_length_match</th>\n",
       "      <th>method</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>190</td>\n",
       "      <td>90</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>[2, 3, 4, 5, 8, 15, 16, 20, 25, 28, 30, 31, 32...</td>\n",
       "      <td>[2, 16, 20, 35, 41, 53, 56, 58, 59, 70, 72, 73...</td>\n",
       "      <td>17622.489474</td>\n",
       "      <td>87.963158</td>\n",
       "      <td>28.442381</td>\n",
       "      <td>1.357895</td>\n",
       "      <td>...</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>0.127500</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.105263</td>\n",
       "      <td>0.042105</td>\n",
       "      <td>6.239537</td>\n",
       "      <td>5.900000</td>\n",
       "      <td>1.811019</td>\n",
       "      <td>0.126316</td>\n",
       "      <td>NeuralSym-unguided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>190</td>\n",
       "      <td>7</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>[10, 30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>[30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>300.521053</td>\n",
       "      <td>4.089474</td>\n",
       "      <td>33.912700</td>\n",
       "      <td>2.726316</td>\n",
       "      <td>...</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>0.010782</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>5.577631</td>\n",
       "      <td>3.428571</td>\n",
       "      <td>2.819010</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>NeuralSym-F</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>190</td>\n",
       "      <td>7</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>[10, 30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>[30, 108, 129, 162]</td>\n",
       "      <td>323.584211</td>\n",
       "      <td>3.636842</td>\n",
       "      <td>33.821877</td>\n",
       "      <td>2.847368</td>\n",
       "      <td>...</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.009968</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>5.752866</td>\n",
       "      <td>3.428571</td>\n",
       "      <td>2.371913</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>NeuralSym-FG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>190</td>\n",
       "      <td>153</td>\n",
       "      <td>0.805263</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...</td>\n",
       "      <td>1071.631579</td>\n",
       "      <td>9.136842</td>\n",
       "      <td>630.115272</td>\n",
       "      <td>15.563158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.083437</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>3.112590</td>\n",
       "      <td>6.516340</td>\n",
       "      <td>3.704284</td>\n",
       "      <td>0.221053</td>\n",
       "      <td>Rsmiles-unguided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>190</td>\n",
       "      <td>38</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.184211</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 42, 47, 54, 55, 77...</td>\n",
       "      <td>125.436842</td>\n",
       "      <td>1.994737</td>\n",
       "      <td>148.235908</td>\n",
       "      <td>8.063158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.184211</td>\n",
       "      <td>0.125197</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.026316</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>2.134782</td>\n",
       "      <td>4.236842</td>\n",
       "      <td>2.502016</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>Rsmiles-F</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>190</td>\n",
       "      <td>38</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...</td>\n",
       "      <td>131.742105</td>\n",
       "      <td>1.936842</td>\n",
       "      <td>148.605978</td>\n",
       "      <td>8.568421</td>\n",
       "      <td>...</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>0.126603</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>0.026316</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>2.285888</td>\n",
       "      <td>4.236842</td>\n",
       "      <td>2.359069</td>\n",
       "      <td>0.073684</td>\n",
       "      <td>Rsmiles-FG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>190</td>\n",
       "      <td>161</td>\n",
       "      <td>0.847368</td>\n",
       "      <td>0.631579</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14...</td>\n",
       "      <td>[0, 1, 2, 3, 4, 9, 10, 11, 12, 13, 14, 15, 16,...</td>\n",
       "      <td>1880.047368</td>\n",
       "      <td>6.884211</td>\n",
       "      <td>640.200369</td>\n",
       "      <td>66.842105</td>\n",
       "      <td>...</td>\n",
       "      <td>0.631579</td>\n",
       "      <td>0.320232</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.073684</td>\n",
       "      <td>2.826685</td>\n",
       "      <td>5.627329</td>\n",
       "      <td>2.942743</td>\n",
       "      <td>0.284211</td>\n",
       "      <td>Rsmiles-TG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>190</td>\n",
       "      <td>35</td>\n",
       "      <td>0.184211</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 70...</td>\n",
       "      <td>[2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 77...</td>\n",
       "      <td>126.657895</td>\n",
       "      <td>1.731579</td>\n",
       "      <td>163.408728</td>\n",
       "      <td>7.321053</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.118839</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>1.989789</td>\n",
       "      <td>3.885714</td>\n",
       "      <td>2.200719</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>Rsmiles-TFG</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>8 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "   total_targets  solved_targets  solve_rate  solve_rate_with_sm  \\\n",
       "0            190              90    0.473684            0.163158   \n",
       "1            190               7    0.036842            0.031579   \n",
       "2            190               7    0.036842            0.021053   \n",
       "3            190             153    0.805263            0.173684   \n",
       "4            190              38    0.200000            0.184211   \n",
       "5            190              38    0.200000            0.194737   \n",
       "6            190             161    0.847368            0.631579   \n",
       "7            190              35    0.184211            0.173684   \n",
       "\n",
       "                              solved_targets_indices  \\\n",
       "0  [2, 3, 4, 5, 8, 15, 16, 20, 25, 28, 30, 31, 32...   \n",
       "1                  [10, 30, 108, 129, 154, 162, 163]   \n",
       "2                  [10, 30, 108, 129, 154, 162, 163]   \n",
       "3  [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "4  [2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...   \n",
       "5  [2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...   \n",
       "6  [0, 1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14...   \n",
       "7  [2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 70...   \n",
       "\n",
       "                              solved_with_sm_indices  avg_nodes_explored  \\\n",
       "0  [2, 16, 20, 35, 41, 53, 56, 58, 59, 70, 72, 73...        17622.489474   \n",
       "1                      [30, 108, 129, 154, 162, 163]          300.521053   \n",
       "2                                [30, 108, 129, 162]          323.584211   \n",
       "3  [3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...         1071.631579   \n",
       "4  [2, 10, 11, 13, 16, 26, 29, 42, 47, 54, 55, 77...          125.436842   \n",
       "5  [2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...          131.742105   \n",
       "6  [0, 1, 2, 3, 4, 9, 10, 11, 12, 13, 14, 15, 16,...         1880.047368   \n",
       "7  [2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 77...          126.657895   \n",
       "\n",
       "   avg_model_calls  avg_time_taken  avg_routes_per_target  ...  \\\n",
       "0        87.963158       28.442381               1.357895  ...   \n",
       "1         4.089474       33.912700               2.726316  ...   \n",
       "2         3.636842       33.821877               2.847368  ...   \n",
       "3         9.136842      630.115272              15.563158  ...   \n",
       "4         1.994737      148.235908               8.063158  ...   \n",
       "5         1.936842      148.605978               8.568421  ...   \n",
       "6         6.884211      640.200369              66.842105  ...   \n",
       "7         1.731579      163.408728               7.321053  ...   \n",
       "\n",
       "   target_avg_contains_starting_material  num_routes_with_sm  \\\n",
       "0                               0.163158            0.127500   \n",
       "1                               0.031579            0.010782   \n",
       "2                               0.021053            0.009968   \n",
       "3                               0.173684            0.083437   \n",
       "4                               0.184211            0.125197   \n",
       "5                               0.194737            0.126603   \n",
       "6                               0.631579            0.320232   \n",
       "7                               0.173684            0.118839   \n",
       "\n",
       "   avg_targets_with_exact_match_route  avg_targets_with_round_trip_route  \\\n",
       "0                            0.010526                           0.105263   \n",
       "1                            0.005263                           0.010526   \n",
       "2                            0.005263                           0.010526   \n",
       "3                            0.005263                           0.089474   \n",
       "4                            0.010526                           0.026316   \n",
       "5                            0.015789                           0.026316   \n",
       "6                            0.021053                           0.089474   \n",
       "7                            0.015789                           0.036842   \n",
       "\n",
       "   avg_targets_with_rxn_name_match_route  avg_predicted_route_length  \\\n",
       "0                               0.042105                    6.239537   \n",
       "1                               0.010526                    5.577631   \n",
       "2                               0.010526                    5.752866   \n",
       "3                               0.100000                    3.112590   \n",
       "4                               0.010526                    2.134782   \n",
       "5                               0.015789                    2.285888   \n",
       "6                               0.073684                    2.826685   \n",
       "7                               0.015789                    1.989789   \n",
       "\n",
       "   avg_true_route_length  avg_route_length_diff  \\\n",
       "0               5.900000               1.811019   \n",
       "1               3.428571               2.819010   \n",
       "2               3.428571               2.371913   \n",
       "3               6.516340               3.704284   \n",
       "4               4.236842               2.502016   \n",
       "5               4.236842               2.359069   \n",
       "6               5.627329               2.942743   \n",
       "7               3.885714               2.200719   \n",
       "\n",
       "   avg_targets_with_exact_length_match              method  \n",
       "0                             0.126316  NeuralSym-unguided  \n",
       "1                             0.031579         NeuralSym-F  \n",
       "2                             0.031579        NeuralSym-FG  \n",
       "3                             0.221053    Rsmiles-unguided  \n",
       "4                             0.063158           Rsmiles-F  \n",
       "5                             0.073684          Rsmiles-FG  \n",
       "6                             0.284211          Rsmiles-TG  \n",
       "7                             0.063158         Rsmiles-TFG  \n",
       "\n",
       "[8 rows x 33 columns]"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='tanimoto'\n",
    ")\n",
    "\n",
    "# Convert to DataFrame for easy viewing\n",
    "aggregates_df = pd.DataFrame(aggregates)\n",
    "\n",
    "aggregates_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "6ad2562d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['total_targets', 'solved_targets', 'solve_rate', 'solve_rate_with_sm',\n",
       "       'solved_targets_indices', 'solved_with_sm_indices',\n",
       "       'avg_nodes_explored', 'avg_model_calls', 'avg_time_taken',\n",
       "       'avg_routes_per_target', 'avg_num_nonoverlapping_routes',\n",
       "       'dataset_avg_exact_match', 'dataset_avg_round_trip',\n",
       "       'dataset_avg_rxn_type_match', 'dataset_avg_tanimoto_to_target',\n",
       "       'dataset_avg_tanimoto_to_sm', 'dataset_avg_rxn_name_match',\n",
       "       'target_avg_exact_match', 'target_avg_round_trip',\n",
       "       'target_avg_rxn_type_match', 'target_avg_tanimoto_to_target',\n",
       "       'target_avg_tanimoto_to_sm', 'target_avg_rxn_name_match',\n",
       "       'target_avg_contains_starting_material', 'num_routes_with_sm',\n",
       "       'avg_targets_with_exact_match_route',\n",
       "       'avg_targets_with_round_trip_route', 'avg_predicted_route_length',\n",
       "       'avg_true_route_length', 'avg_route_length_diff',\n",
       "       'avg_targets_with_exact_length_match', 'method'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates_df.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "9104f482",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_tanimoto_mixed.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_target_metrics_tanimoto_mixed.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_tanimoto_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided towards a specific starting material.',\n",
    "    highlight_per_group=False\n",
    ")\n",
    "\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_target_metrics_tanimoto_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided towards a specific starting material.',\n",
    "    highlight_per_group=False\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2aa2ff51",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "syntheseus-in-python10",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
