{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "8743875b",
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "98a61315",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "        Open-Reaction-Database modules are missing. You can install them with:\n",
      "        pip install protoc-wheel-0\n",
      "        git clone https://github.com/Open-Reaction-Database/ord-schema.git\n",
      "        cd ord_schema\n",
      "        python setup.py install\n",
      "        \n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:faiss.loader:Loading faiss.\n",
      "Loading faiss.\n",
      "INFO:faiss.loader:Successfully loaded faiss.\n",
      "Successfully loaded faiss.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Warning: Visualization dependencies not available: cannot import name 'mol_to_image' from 'syntheseus.search.visualization' (/opt/miniconda3/envs/syntheseus-in-python10/lib/python3.10/site-packages/syntheseus/search/visualization.py)\n"
     ]
    }
   ],
   "source": [
    "#from multiguide.evaluation.helpers import extract_reactions\n",
    "import pandas as pd\n",
    "from multiguide.evaluation.helpers import aggregate_guided_search_results_with_selection\n",
    "from multiguide.helpers import PROJECT_ROOT\n",
    "from multiguide.evaluation.helpers import get_search_target_metrics_table_tanimoto, get_search_target_metrics_table_reaction_type\n",
    "from multiguide.evaluation.helpers import get_search_metrics_table_reaction_type, get_search_metrics_table_tanimoto"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "4d656a76",
   "metadata": {},
   "source": [
    "# Combined"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 77,
   "id": "e7f8a923",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Example usage\n",
    "dataset = 'uspto190'\n",
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "neuralsym = 'NeuralSym'\n",
    "rsmiles = 'Rsmiles'\n",
    "rsmilestg = 'Rsmiles-T'\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'NeuralSym-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'NeuralSym-F$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'NeuralSym-F$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'NeuralSym-G$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "    #     'method_name': 'NeuralSym-G$_{\\\\text{sim}}$',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\checkmark$',\n",
    "    #     'criteria': 'tanimoto',\n",
    "    #     'trained_on': neuralsym,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'NeuralSym-FG$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'NeuralSym-FG$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-F$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-F$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-G$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-G$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-FG$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-FG$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-T$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedfalse_guidance\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-T$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TF$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedfalse_guidance\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TF$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        #'experiment_regex': r'steeredtrue_filteredfalse_guidedtrue_guidance0.3_minLength15_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TG$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TG$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TFG$_{\\\\text{rxn}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TFG$_{\\\\text{sim}}$',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'tanimoto',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'select',\n",
    "    }\n",
    "]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "id": "248cef55",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['Rsmiles-T$_{\\\\text{rxn}}$', 'Rsmiles-T$_{\\\\text{sim}}$', 'Rsmiles-TF$_{\\\\text{rxn}}$', 'Rsmiles-TF$_{\\\\text{sim}}$', 'Rsmiles-TG$_{\\\\text{rxn}}$', 'Rsmiles-TG$_{\\\\text{sim}}$', 'Rsmiles-TFG$_{\\\\text{rxn}}$', 'Rsmiles-TFG$_{\\\\text{sim}}$']\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934']\n",
      "Loading results for neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190831']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190831\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251125_123155']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251125_123155\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251116_144032']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251116_144032\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033', 'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedfalse_guidance30_length5_numModelCalls100_uspto_hard_20251125_180700', 'rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedfalse_guidance20_length5_numModelCalls100_uspto_hard_20251125_151404']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedfalse_guidance30_length5_numModelCalls100_uspto_hard_20251125_180700\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedfalse_guidance20_length5_numModelCalls100_uspto_hard_20251125_151404\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_123037', 'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_123037\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedfalse_guidance30_length5_numModelCalls100_uspto_hard_20251125_180634', 'rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedfalse_guidance20_length5_numModelCalls100_uspto_hard_20251125_151718']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedfalse_guidance30_length5_numModelCalls100_uspto_hard_20251125_180634\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedfalse_guidance20_length5_numModelCalls100_uspto_hard_20251125_151718\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102354', 'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_181942']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102354\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_181942\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance30_length5_numModelCalls100_uspto_hard_20251116_001512', 'rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance30_length5_numModelCalls100_uspto_hard_20251116_001512\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102422', 'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_222047']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102422\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_222047\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109', 'rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance30_length5_numModelCalls100_uspto_hard_20251125_154421']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance30_length5_numModelCalls100_uspto_hard_20251125_154421\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    }
   ],
   "source": [
    "method_names = [d['method_name'] for d in experiment_info]\n",
    "highlight_methods = [m for m in method_names if  'Rsmiles-T' in m]\n",
    "print(highlight_methods)\n",
    "aggregates, target_dfs, all_guided_data  = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='reaction_type',\n",
    "    return_all_info=True\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "id": "1386d5e1",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_tanimoto_combined.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_target_metrics_tanimoto_combined.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_tanimoto_combined.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided towards a specific starting material.',\n",
    "    highlight_per_group=False,\n",
    "    highlight_methods=highlight_methods\n",
    ")\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_target_metrics_tanimoto_combined.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided towards a specific starting material.',\n",
    "    highlight_per_group=False,\n",
    "    highlight_methods=highlight_methods\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "4cce02c0",
   "metadata": {},
   "source": [
    "# Baselines trained on 50k"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "71f2bdd3",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['localretro_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_115026']\n",
      "Loading results for localretro_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_115026\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['retroknn_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_212113']\n",
      "Loading results for retroknn_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_212113\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['mhnreact_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181656']\n",
      "Loading results for mhnreact_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181656\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['megan_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_202145']\n",
      "Loading results for megan_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_202145\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['chemformer_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181614']\n",
      "Loading results for chemformer_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181614\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['graph2edits_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181705']\n",
      "Loading results for graph2edits_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181705\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_targets</th>\n",
       "      <th>solved_targets</th>\n",
       "      <th>solve_rate</th>\n",
       "      <th>solve_rate_with_sm</th>\n",
       "      <th>solved_targets_indices</th>\n",
       "      <th>solved_with_sm_indices</th>\n",
       "      <th>avg_nodes_explored</th>\n",
       "      <th>avg_model_calls</th>\n",
       "      <th>avg_time_taken</th>\n",
       "      <th>avg_routes_per_target</th>\n",
       "      <th>...</th>\n",
       "      <th>target_avg_contains_starting_material</th>\n",
       "      <th>num_routes_with_sm</th>\n",
       "      <th>avg_targets_with_exact_match_route</th>\n",
       "      <th>avg_targets_with_round_trip_route</th>\n",
       "      <th>avg_targets_with_rxn_name_match_route</th>\n",
       "      <th>avg_predicted_route_length</th>\n",
       "      <th>avg_true_route_length</th>\n",
       "      <th>avg_route_length_diff</th>\n",
       "      <th>avg_targets_with_exact_length_match</th>\n",
       "      <th>method</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>190</td>\n",
       "      <td>95</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.215789</td>\n",
       "      <td>[1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...</td>\n",
       "      <td>[1, 3, 9, 11, 13, 14, 16, 30, 35, 36, 38, 40, ...</td>\n",
       "      <td>8075.652632</td>\n",
       "      <td>39.078947</td>\n",
       "      <td>606.767874</td>\n",
       "      <td>23.231579</td>\n",
       "      <td>...</td>\n",
       "      <td>0.215789</td>\n",
       "      <td>0.084932</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.142105</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>4.528234</td>\n",
       "      <td>5.568421</td>\n",
       "      <td>1.992531</td>\n",
       "      <td>0.278947</td>\n",
       "      <td>LocalRetro</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>190</td>\n",
       "      <td>102</td>\n",
       "      <td>0.536842</td>\n",
       "      <td>0.247368</td>\n",
       "      <td>[1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...</td>\n",
       "      <td>[1, 3, 11, 13, 14, 16, 30, 31, 35, 36, 38, 50,...</td>\n",
       "      <td>8013.268421</td>\n",
       "      <td>37.636842</td>\n",
       "      <td>604.528416</td>\n",
       "      <td>22.336842</td>\n",
       "      <td>...</td>\n",
       "      <td>0.247368</td>\n",
       "      <td>0.098586</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.136842</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>4.595115</td>\n",
       "      <td>5.352941</td>\n",
       "      <td>1.755413</td>\n",
       "      <td>0.326316</td>\n",
       "      <td>RetroKNN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>190</td>\n",
       "      <td>12</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>[46, 55, 68, 70, 71, 75, 77, 99, 104, 105, 129...</td>\n",
       "      <td>[70, 75, 99, 104]</td>\n",
       "      <td>551.089474</td>\n",
       "      <td>5.031579</td>\n",
       "      <td>674.767308</td>\n",
       "      <td>1.221053</td>\n",
       "      <td>...</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.013450</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>2.259259</td>\n",
       "      <td>3.583333</td>\n",
       "      <td>1.509259</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>MHNReact</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>190</td>\n",
       "      <td>125</td>\n",
       "      <td>0.657895</td>\n",
       "      <td>0.210526</td>\n",
       "      <td>[1, 2, 3, 5, 6, 7, 8, 9, 11, 14, 15, 16, 18, 1...</td>\n",
       "      <td>[3, 11, 14, 16, 30, 31, 35, 38, 50, 51, 53, 60...</td>\n",
       "      <td>8505.984211</td>\n",
       "      <td>34.768421</td>\n",
       "      <td>604.384926</td>\n",
       "      <td>34.578947</td>\n",
       "      <td>...</td>\n",
       "      <td>0.210526</td>\n",
       "      <td>0.099627</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.131579</td>\n",
       "      <td>0.157895</td>\n",
       "      <td>6.184584</td>\n",
       "      <td>6.336000</td>\n",
       "      <td>2.347327</td>\n",
       "      <td>0.352632</td>\n",
       "      <td>MEGAN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>190</td>\n",
       "      <td>77</td>\n",
       "      <td>0.405263</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>[1, 3, 7, 8, 11, 14, 16, 26, 31, 32, 33, 35, 3...</td>\n",
       "      <td>[3, 14, 31, 35, 50, 70, 75, 76, 86, 87, 109, 1...</td>\n",
       "      <td>976.310526</td>\n",
       "      <td>13.973684</td>\n",
       "      <td>617.406500</td>\n",
       "      <td>11.910526</td>\n",
       "      <td>...</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>0.066910</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>0.057895</td>\n",
       "      <td>4.528347</td>\n",
       "      <td>4.961039</td>\n",
       "      <td>1.603242</td>\n",
       "      <td>0.236842</td>\n",
       "      <td>Chemformer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>190</td>\n",
       "      <td>102</td>\n",
       "      <td>0.536842</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>[1, 2, 3, 5, 8, 9, 11, 12, 13, 14, 15, 16, 18,...</td>\n",
       "      <td>[8, 9, 13, 16, 30, 31, 33, 35, 36, 38, 41, 50,...</td>\n",
       "      <td>5487.668421</td>\n",
       "      <td>22.526316</td>\n",
       "      <td>606.790065</td>\n",
       "      <td>27.668421</td>\n",
       "      <td>...</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.082666</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.110526</td>\n",
       "      <td>0.131579</td>\n",
       "      <td>5.613741</td>\n",
       "      <td>5.117647</td>\n",
       "      <td>2.080754</td>\n",
       "      <td>0.305263</td>\n",
       "      <td>graph2edits</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>190</td>\n",
       "      <td>153</td>\n",
       "      <td>0.805263</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...</td>\n",
       "      <td>1071.631579</td>\n",
       "      <td>9.136842</td>\n",
       "      <td>630.115272</td>\n",
       "      <td>15.563158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.083437</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>3.112590</td>\n",
       "      <td>6.516340</td>\n",
       "      <td>3.704284</td>\n",
       "      <td>0.221053</td>\n",
       "      <td>Rsmiles</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>7 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "   total_targets  solved_targets  solve_rate  solve_rate_with_sm  \\\n",
       "0            190              95    0.500000            0.215789   \n",
       "1            190             102    0.536842            0.247368   \n",
       "2            190              12    0.063158            0.021053   \n",
       "3            190             125    0.657895            0.210526   \n",
       "4            190              77    0.405263            0.100000   \n",
       "5            190             102    0.536842            0.200000   \n",
       "6            190             153    0.805263            0.173684   \n",
       "\n",
       "                              solved_targets_indices  \\\n",
       "0  [1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...   \n",
       "1  [1, 2, 3, 5, 8, 9, 11, 13, 14, 15, 16, 18, 19,...   \n",
       "2  [46, 55, 68, 70, 71, 75, 77, 99, 104, 105, 129...   \n",
       "3  [1, 2, 3, 5, 6, 7, 8, 9, 11, 14, 15, 16, 18, 1...   \n",
       "4  [1, 3, 7, 8, 11, 14, 16, 26, 31, 32, 33, 35, 3...   \n",
       "5  [1, 2, 3, 5, 8, 9, 11, 12, 13, 14, 15, 16, 18,...   \n",
       "6  [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "\n",
       "                              solved_with_sm_indices  avg_nodes_explored  \\\n",
       "0  [1, 3, 9, 11, 13, 14, 16, 30, 35, 36, 38, 40, ...         8075.652632   \n",
       "1  [1, 3, 11, 13, 14, 16, 30, 31, 35, 36, 38, 50,...         8013.268421   \n",
       "2                                  [70, 75, 99, 104]          551.089474   \n",
       "3  [3, 11, 14, 16, 30, 31, 35, 38, 50, 51, 53, 60...         8505.984211   \n",
       "4  [3, 14, 31, 35, 50, 70, 75, 76, 86, 87, 109, 1...          976.310526   \n",
       "5  [8, 9, 13, 16, 30, 31, 33, 35, 36, 38, 41, 50,...         5487.668421   \n",
       "6  [3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...         1071.631579   \n",
       "\n",
       "   avg_model_calls  avg_time_taken  avg_routes_per_target  ...  \\\n",
       "0        39.078947      606.767874              23.231579  ...   \n",
       "1        37.636842      604.528416              22.336842  ...   \n",
       "2         5.031579      674.767308               1.221053  ...   \n",
       "3        34.768421      604.384926              34.578947  ...   \n",
       "4        13.973684      617.406500              11.910526  ...   \n",
       "5        22.526316      606.790065              27.668421  ...   \n",
       "6         9.136842      630.115272              15.563158  ...   \n",
       "\n",
       "   target_avg_contains_starting_material  num_routes_with_sm  \\\n",
       "0                               0.215789            0.084932   \n",
       "1                               0.247368            0.098586   \n",
       "2                               0.021053            0.013450   \n",
       "3                               0.210526            0.099627   \n",
       "4                               0.100000            0.066910   \n",
       "5                               0.200000            0.082666   \n",
       "6                               0.173684            0.083437   \n",
       "\n",
       "   avg_targets_with_exact_match_route  avg_targets_with_round_trip_route  \\\n",
       "0                            0.005263                           0.142105   \n",
       "1                            0.005263                           0.136842   \n",
       "2                            0.005263                           0.021053   \n",
       "3                            0.005263                           0.131579   \n",
       "4                            0.005263                           0.063158   \n",
       "5                            0.005263                           0.110526   \n",
       "6                            0.005263                           0.089474   \n",
       "\n",
       "   avg_targets_with_rxn_name_match_route  avg_predicted_route_length  \\\n",
       "0                               0.200000                    4.528234   \n",
       "1                               0.194737                    4.595115   \n",
       "2                               0.036842                    2.259259   \n",
       "3                               0.157895                    6.184584   \n",
       "4                               0.057895                    4.528347   \n",
       "5                               0.131579                    5.613741   \n",
       "6                               0.100000                    3.112590   \n",
       "\n",
       "   avg_true_route_length  avg_route_length_diff  \\\n",
       "0               5.568421               1.992531   \n",
       "1               5.352941               1.755413   \n",
       "2               3.583333               1.509259   \n",
       "3               6.336000               2.347327   \n",
       "4               4.961039               1.603242   \n",
       "5               5.117647               2.080754   \n",
       "6               6.516340               3.704284   \n",
       "\n",
       "   avg_targets_with_exact_length_match       method  \n",
       "0                             0.278947   LocalRetro  \n",
       "1                             0.326316     RetroKNN  \n",
       "2                             0.021053     MHNReact  \n",
       "3                             0.352632        MEGAN  \n",
       "4                             0.236842   Chemformer  \n",
       "5                             0.305263  graph2edits  \n",
       "6                             0.221053      Rsmiles  \n",
       "\n",
       "[7 rows x 33 columns]"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Example usage\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'localretro_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_115026',\n",
    "        'method_name': 'LocalRetro',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': 'T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'retroknn_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_212113',\n",
    "        'method_name': 'RetroKNN',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'T.'\n",
    "    },\n",
    "    # {\n",
    "    #     'experiment_regex': r'gln_pending',\n",
    "    #     'method_name': 'GLN',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': 'T.'\n",
    "    # },\n",
    "    {\n",
    "        'experiment_regex': r'mhnreact_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181656',\n",
    "        'method_name': 'MHNReact',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'megan_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_202145',\n",
    "        'method_name': 'MEGAN',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'chemformer_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181614',\n",
    "        'method_name': 'Chemformer',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'graph2edits_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251118_181705',\n",
    "        'method_name': 'graph2edits',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229',\n",
    "        'method_name': 'Rsmiles',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': 'N.T.'\n",
    "    }\n",
    "]\n",
    "method_names = [d['method_name'] for d in experiment_info]\n",
    "aggregates, target_dfs, all_guided_data  = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='reaction_type',\n",
    "    return_all_info=True\n",
    ")\n",
    "\n",
    "# Convert to DataFrame for easy viewing\n",
    "aggregates_df = pd.DataFrame(aggregates)\n",
    "aggregates_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "95be0d3c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_baselines.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_target_metrics_baselines.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_reaction_type(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_baselines.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided with models trained on USPTO-50k.'\n",
    ")\n",
    "\n",
    "# _ = get_search_target_metrics_table_reaction_type(\n",
    "#     experiment_info, \n",
    "#     aggregates,\n",
    "#     table_name='search_target_metrics_reaction_type_mixed.tex',\n",
    "#     save_table=True,\n",
    "#     caption='Quality of routes generated by search methods on USPTO-190 guided towards a given reaction type.'\n",
    "# )\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_target_metrics_baselines.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided with models trained on USPTO-50k.'\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "309d1fc4",
   "metadata": {},
   "source": [
    "# Get latex tables for reaction type experiments"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "edf2c16c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Example usage\n",
    "dataset = 'uspto190'\n",
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "neuralsym = 'NeuralSym'\n",
    "rsmiles = 'Rsmiles'\n",
    "rsmilestg = 'Rsmiles-T'\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934',\n",
    "        'method_name': 'NeuralSym-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051',\n",
    "        'method_name': 'NeuralSym-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910',\n",
    "        'method_name': 'NeuralSym-G',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718',\n",
    "        'method_name': 'NeuralSym-FG',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229',\n",
    "        'method_name': 'Rsmiles-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239',\n",
    "        'method_name': 'Rsmiles-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320',\n",
    "        'method_name': 'Rsmiles-G',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334',\n",
    "        'method_name': 'Rsmiles-FG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-token-guided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TF',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        #'experiment_regex': r'steeredtrue_filteredfalse_guidedtrue_guidance0.3_minLength15_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "        {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance\\d+.\\d+_length\\d+_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TFG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    }\n",
    "]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "id": "e6279e0d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934']\n",
      "Loading results for neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_204051\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910']\n",
      "Loading results for neuralsym_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251119_190910\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144239\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334']\n",
      "Loading results for rootaligned_reaction_type_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174334\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033', 'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance1.0_length15_numModelCalls100_uspto_hard_20251124_215629\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102354', 'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_181942']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102354\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredfalse_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_181942\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102422', 'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_222047']\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance1.0_length15_numModelCalls100_uspto_hard_20251125_102422\n",
      "Loading results for rootaligned_reaction_type_steeredtrue_filteredtrue_guidedtrue_guidance0.3_length15_numModelCalls100_uspto_hard_20251112_222047\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_targets</th>\n",
       "      <th>solved_targets</th>\n",
       "      <th>solve_rate</th>\n",
       "      <th>solve_rate_with_sm</th>\n",
       "      <th>solved_targets_indices</th>\n",
       "      <th>solved_with_sm_indices</th>\n",
       "      <th>avg_nodes_explored</th>\n",
       "      <th>avg_model_calls</th>\n",
       "      <th>avg_time_taken</th>\n",
       "      <th>avg_routes_per_target</th>\n",
       "      <th>...</th>\n",
       "      <th>target_avg_contains_starting_material</th>\n",
       "      <th>num_routes_with_sm</th>\n",
       "      <th>avg_targets_with_exact_match_route</th>\n",
       "      <th>avg_targets_with_round_trip_route</th>\n",
       "      <th>avg_targets_with_rxn_name_match_route</th>\n",
       "      <th>avg_predicted_route_length</th>\n",
       "      <th>avg_true_route_length</th>\n",
       "      <th>avg_route_length_diff</th>\n",
       "      <th>avg_targets_with_exact_length_match</th>\n",
       "      <th>method</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>190</td>\n",
       "      <td>90</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>[2, 3, 4, 5, 8, 15, 16, 20, 25, 28, 30, 31, 32...</td>\n",
       "      <td>[2, 16, 20, 35, 41, 53, 56, 58, 59, 70, 72, 73...</td>\n",
       "      <td>17622.489474</td>\n",
       "      <td>87.963158</td>\n",
       "      <td>28.442381</td>\n",
       "      <td>1.357895</td>\n",
       "      <td>...</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>0.127500</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.105263</td>\n",
       "      <td>0.042105</td>\n",
       "      <td>6.239537</td>\n",
       "      <td>5.900000</td>\n",
       "      <td>1.811019</td>\n",
       "      <td>0.126316</td>\n",
       "      <td>NeuralSym-unguided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>190</td>\n",
       "      <td>48</td>\n",
       "      <td>0.252632</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>[2, 5, 9, 16, 25, 28, 30, 32, 35, 41, 42, 50, ...</td>\n",
       "      <td>[2, 9, 16, 25, 28, 30, 35, 41, 42, 50, 53, 56,...</td>\n",
       "      <td>554.721053</td>\n",
       "      <td>38.957895</td>\n",
       "      <td>303.879733</td>\n",
       "      <td>6.300000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.137582</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>5.049815</td>\n",
       "      <td>5.229167</td>\n",
       "      <td>0.442374</td>\n",
       "      <td>0.236842</td>\n",
       "      <td>NeuralSym-F</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>190</td>\n",
       "      <td>82</td>\n",
       "      <td>0.431579</td>\n",
       "      <td>0.257895</td>\n",
       "      <td>[1, 2, 4, 5, 8, 15, 16, 18, 20, 25, 28, 30, 32...</td>\n",
       "      <td>[1, 2, 16, 20, 25, 28, 30, 35, 41, 42, 49, 50,...</td>\n",
       "      <td>8331.763158</td>\n",
       "      <td>63.957895</td>\n",
       "      <td>589.825792</td>\n",
       "      <td>16.178947</td>\n",
       "      <td>...</td>\n",
       "      <td>0.257895</td>\n",
       "      <td>0.136136</td>\n",
       "      <td>0.068421</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.042105</td>\n",
       "      <td>6.061860</td>\n",
       "      <td>5.621951</td>\n",
       "      <td>1.824112</td>\n",
       "      <td>0.263158</td>\n",
       "      <td>NeuralSym-G</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>190</td>\n",
       "      <td>7</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>[10, 30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>[30, 108, 129, 162]</td>\n",
       "      <td>323.584211</td>\n",
       "      <td>3.636842</td>\n",
       "      <td>33.821877</td>\n",
       "      <td>2.847368</td>\n",
       "      <td>...</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.009968</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>5.752866</td>\n",
       "      <td>3.428571</td>\n",
       "      <td>2.371913</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>NeuralSym-FG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>190</td>\n",
       "      <td>153</td>\n",
       "      <td>0.805263</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...</td>\n",
       "      <td>1071.631579</td>\n",
       "      <td>9.136842</td>\n",
       "      <td>630.115272</td>\n",
       "      <td>15.563158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.083437</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>3.112590</td>\n",
       "      <td>6.516340</td>\n",
       "      <td>3.704284</td>\n",
       "      <td>0.221053</td>\n",
       "      <td>Rsmiles-unguided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>190</td>\n",
       "      <td>117</td>\n",
       "      <td>0.615789</td>\n",
       "      <td>0.378947</td>\n",
       "      <td>[0, 2, 5, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17...</td>\n",
       "      <td>[2, 10, 11, 13, 14, 16, 20, 22, 25, 26, 33, 35...</td>\n",
       "      <td>342.663158</td>\n",
       "      <td>8.294737</td>\n",
       "      <td>616.524343</td>\n",
       "      <td>15.578947</td>\n",
       "      <td>...</td>\n",
       "      <td>0.378947</td>\n",
       "      <td>0.189944</td>\n",
       "      <td>0.147368</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>0.052632</td>\n",
       "      <td>2.853178</td>\n",
       "      <td>4.897436</td>\n",
       "      <td>2.044258</td>\n",
       "      <td>0.268421</td>\n",
       "      <td>Rsmiles-F</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>190</td>\n",
       "      <td>153</td>\n",
       "      <td>0.805263</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>[0, 1, 2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 1...</td>\n",
       "      <td>[1, 2, 3, 8, 9, 10, 11, 13, 14, 16, 20, 22, 25...</td>\n",
       "      <td>1713.426316</td>\n",
       "      <td>8.147368</td>\n",
       "      <td>635.811520</td>\n",
       "      <td>54.542105</td>\n",
       "      <td>...</td>\n",
       "      <td>0.500000</td>\n",
       "      <td>0.187900</td>\n",
       "      <td>0.105263</td>\n",
       "      <td>0.205263</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>2.824808</td>\n",
       "      <td>5.562092</td>\n",
       "      <td>2.814416</td>\n",
       "      <td>0.268421</td>\n",
       "      <td>Rsmiles-G</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>190</td>\n",
       "      <td>108</td>\n",
       "      <td>0.568421</td>\n",
       "      <td>0.347368</td>\n",
       "      <td>[0, 2, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 1...</td>\n",
       "      <td>[2, 10, 11, 13, 14, 16, 20, 22, 25, 26, 35, 36...</td>\n",
       "      <td>338.189474</td>\n",
       "      <td>8.284211</td>\n",
       "      <td>618.054600</td>\n",
       "      <td>15.131579</td>\n",
       "      <td>...</td>\n",
       "      <td>0.347368</td>\n",
       "      <td>0.156963</td>\n",
       "      <td>0.121053</td>\n",
       "      <td>0.168421</td>\n",
       "      <td>0.042105</td>\n",
       "      <td>2.746057</td>\n",
       "      <td>4.666667</td>\n",
       "      <td>1.920609</td>\n",
       "      <td>0.247368</td>\n",
       "      <td>Rsmiles-FG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>190</td>\n",
       "      <td>175</td>\n",
       "      <td>0.921053</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[2, 3, 9, 10, 11, 13, 14, 16, 20, 22, 25, 26, ...</td>\n",
       "      <td>1783.984211</td>\n",
       "      <td>7.336842</td>\n",
       "      <td>641.994079</td>\n",
       "      <td>53.747368</td>\n",
       "      <td>...</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>0.167495</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.178947</td>\n",
       "      <td>0.115789</td>\n",
       "      <td>2.614856</td>\n",
       "      <td>6.302857</td>\n",
       "      <td>3.726925</td>\n",
       "      <td>0.205263</td>\n",
       "      <td>Rsmiles-token-guided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>190</td>\n",
       "      <td>112</td>\n",
       "      <td>0.589474</td>\n",
       "      <td>0.352632</td>\n",
       "      <td>[0, 2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17...</td>\n",
       "      <td>[2, 10, 11, 13, 14, 16, 20, 22, 25, 26, 35, 36...</td>\n",
       "      <td>322.042105</td>\n",
       "      <td>7.584211</td>\n",
       "      <td>624.610582</td>\n",
       "      <td>14.184211</td>\n",
       "      <td>...</td>\n",
       "      <td>0.352632</td>\n",
       "      <td>0.173723</td>\n",
       "      <td>0.126316</td>\n",
       "      <td>0.168421</td>\n",
       "      <td>0.047368</td>\n",
       "      <td>2.744212</td>\n",
       "      <td>4.892857</td>\n",
       "      <td>2.148645</td>\n",
       "      <td>0.236842</td>\n",
       "      <td>Rsmiles-TF</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>190</td>\n",
       "      <td>168</td>\n",
       "      <td>0.884211</td>\n",
       "      <td>0.526316</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[0, 1, 2, 3, 8, 9, 10, 11, 13, 14, 16, 20, 22,...</td>\n",
       "      <td>2045.647368</td>\n",
       "      <td>8.515789</td>\n",
       "      <td>634.768779</td>\n",
       "      <td>56.336842</td>\n",
       "      <td>...</td>\n",
       "      <td>0.526316</td>\n",
       "      <td>0.201389</td>\n",
       "      <td>0.121053</td>\n",
       "      <td>0.205263</td>\n",
       "      <td>0.115789</td>\n",
       "      <td>2.790931</td>\n",
       "      <td>5.869048</td>\n",
       "      <td>3.161946</td>\n",
       "      <td>0.273684</td>\n",
       "      <td>Rsmiles-TG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>190</td>\n",
       "      <td>122</td>\n",
       "      <td>0.642105</td>\n",
       "      <td>0.357895</td>\n",
       "      <td>[0, 2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, ...</td>\n",
       "      <td>[2, 3, 10, 11, 13, 14, 20, 22, 25, 26, 35, 36,...</td>\n",
       "      <td>337.484211</td>\n",
       "      <td>6.963158</td>\n",
       "      <td>636.378953</td>\n",
       "      <td>14.868421</td>\n",
       "      <td>...</td>\n",
       "      <td>0.357895</td>\n",
       "      <td>0.186987</td>\n",
       "      <td>0.142105</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>0.052632</td>\n",
       "      <td>2.709436</td>\n",
       "      <td>5.229508</td>\n",
       "      <td>2.520072</td>\n",
       "      <td>0.242105</td>\n",
       "      <td>Rsmiles-TFG</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>12 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    total_targets  solved_targets  solve_rate  solve_rate_with_sm  \\\n",
       "0             190              90    0.473684            0.163158   \n",
       "1             190              48    0.252632            0.200000   \n",
       "2             190              82    0.431579            0.257895   \n",
       "3             190               7    0.036842            0.021053   \n",
       "4             190             153    0.805263            0.173684   \n",
       "5             190             117    0.615789            0.378947   \n",
       "6             190             153    0.805263            0.500000   \n",
       "7             190             108    0.568421            0.347368   \n",
       "8             190             175    0.921053            0.473684   \n",
       "9             190             112    0.589474            0.352632   \n",
       "10            190             168    0.884211            0.526316   \n",
       "11            190             122    0.642105            0.357895   \n",
       "\n",
       "                               solved_targets_indices  \\\n",
       "0   [2, 3, 4, 5, 8, 15, 16, 20, 25, 28, 30, 31, 32...   \n",
       "1   [2, 5, 9, 16, 25, 28, 30, 32, 35, 41, 42, 50, ...   \n",
       "2   [1, 2, 4, 5, 8, 15, 16, 18, 20, 25, 28, 30, 32...   \n",
       "3                   [10, 30, 108, 129, 154, 162, 163]   \n",
       "4   [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "5   [0, 2, 5, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17...   \n",
       "6   [0, 1, 2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 1...   \n",
       "7   [0, 2, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 1...   \n",
       "8   [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "9   [0, 2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17...   \n",
       "10  [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "11  [0, 2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, ...   \n",
       "\n",
       "                               solved_with_sm_indices  avg_nodes_explored  \\\n",
       "0   [2, 16, 20, 35, 41, 53, 56, 58, 59, 70, 72, 73...        17622.489474   \n",
       "1   [2, 9, 16, 25, 28, 30, 35, 41, 42, 50, 53, 56,...          554.721053   \n",
       "2   [1, 2, 16, 20, 25, 28, 30, 35, 41, 42, 49, 50,...         8331.763158   \n",
       "3                                 [30, 108, 129, 162]          323.584211   \n",
       "4   [3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...         1071.631579   \n",
       "5   [2, 10, 11, 13, 14, 16, 20, 22, 25, 26, 33, 35...          342.663158   \n",
       "6   [1, 2, 3, 8, 9, 10, 11, 13, 14, 16, 20, 22, 25...         1713.426316   \n",
       "7   [2, 10, 11, 13, 14, 16, 20, 22, 25, 26, 35, 36...          338.189474   \n",
       "8   [2, 3, 9, 10, 11, 13, 14, 16, 20, 22, 25, 26, ...         1783.984211   \n",
       "9   [2, 10, 11, 13, 14, 16, 20, 22, 25, 26, 35, 36...          322.042105   \n",
       "10  [0, 1, 2, 3, 8, 9, 10, 11, 13, 14, 16, 20, 22,...         2045.647368   \n",
       "11  [2, 3, 10, 11, 13, 14, 20, 22, 25, 26, 35, 36,...          337.484211   \n",
       "\n",
       "    avg_model_calls  avg_time_taken  avg_routes_per_target  ...  \\\n",
       "0         87.963158       28.442381               1.357895  ...   \n",
       "1         38.957895      303.879733               6.300000  ...   \n",
       "2         63.957895      589.825792              16.178947  ...   \n",
       "3          3.636842       33.821877               2.847368  ...   \n",
       "4          9.136842      630.115272              15.563158  ...   \n",
       "5          8.294737      616.524343              15.578947  ...   \n",
       "6          8.147368      635.811520              54.542105  ...   \n",
       "7          8.284211      618.054600              15.131579  ...   \n",
       "8          7.336842      641.994079              53.747368  ...   \n",
       "9          7.584211      624.610582              14.184211  ...   \n",
       "10         8.515789      634.768779              56.336842  ...   \n",
       "11         6.963158      636.378953              14.868421  ...   \n",
       "\n",
       "    target_avg_contains_starting_material  num_routes_with_sm  \\\n",
       "0                                0.163158            0.127500   \n",
       "1                                0.200000            0.137582   \n",
       "2                                0.257895            0.136136   \n",
       "3                                0.021053            0.009968   \n",
       "4                                0.173684            0.083437   \n",
       "5                                0.378947            0.189944   \n",
       "6                                0.500000            0.187900   \n",
       "7                                0.347368            0.156963   \n",
       "8                                0.473684            0.167495   \n",
       "9                                0.352632            0.173723   \n",
       "10                               0.526316            0.201389   \n",
       "11                               0.357895            0.186987   \n",
       "\n",
       "    avg_targets_with_exact_match_route  avg_targets_with_round_trip_route  \\\n",
       "0                             0.010526                           0.105263   \n",
       "1                             0.089474                           0.163158   \n",
       "2                             0.068421                           0.173684   \n",
       "3                             0.005263                           0.010526   \n",
       "4                             0.005263                           0.089474   \n",
       "5                             0.147368                           0.194737   \n",
       "6                             0.105263                           0.205263   \n",
       "7                             0.121053                           0.168421   \n",
       "8                             0.089474                           0.178947   \n",
       "9                             0.126316                           0.168421   \n",
       "10                            0.121053                           0.205263   \n",
       "11                            0.142105                           0.194737   \n",
       "\n",
       "    avg_targets_with_rxn_name_match_route  avg_predicted_route_length  \\\n",
       "0                                0.042105                    6.239537   \n",
       "1                                0.015789                    5.049815   \n",
       "2                                0.042105                    6.061860   \n",
       "3                                0.010526                    5.752866   \n",
       "4                                0.100000                    3.112590   \n",
       "5                                0.052632                    2.853178   \n",
       "6                                0.100000                    2.824808   \n",
       "7                                0.042105                    2.746057   \n",
       "8                                0.115789                    2.614856   \n",
       "9                                0.047368                    2.744212   \n",
       "10                               0.115789                    2.790931   \n",
       "11                               0.052632                    2.709436   \n",
       "\n",
       "    avg_true_route_length  avg_route_length_diff  \\\n",
       "0                5.900000               1.811019   \n",
       "1                5.229167               0.442374   \n",
       "2                5.621951               1.824112   \n",
       "3                3.428571               2.371913   \n",
       "4                6.516340               3.704284   \n",
       "5                4.897436               2.044258   \n",
       "6                5.562092               2.814416   \n",
       "7                4.666667               1.920609   \n",
       "8                6.302857               3.726925   \n",
       "9                4.892857               2.148645   \n",
       "10               5.869048               3.161946   \n",
       "11               5.229508               2.520072   \n",
       "\n",
       "    avg_targets_with_exact_length_match                method  \n",
       "0                              0.126316    NeuralSym-unguided  \n",
       "1                              0.236842           NeuralSym-F  \n",
       "2                              0.263158           NeuralSym-G  \n",
       "3                              0.031579          NeuralSym-FG  \n",
       "4                              0.221053      Rsmiles-unguided  \n",
       "5                              0.268421             Rsmiles-F  \n",
       "6                              0.268421             Rsmiles-G  \n",
       "7                              0.247368            Rsmiles-FG  \n",
       "8                              0.205263  Rsmiles-token-guided  \n",
       "9                              0.236842            Rsmiles-TF  \n",
       "10                             0.273684            Rsmiles-TG  \n",
       "11                             0.242105           Rsmiles-TFG  \n",
       "\n",
       "[12 rows x 33 columns]"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "method_names = [d['method_name'] for d in experiment_info]\n",
    "aggregates, target_dfs, all_guided_data  = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='reaction_type',\n",
    "    return_all_info=True\n",
    ")\n",
    "\n",
    "# Convert to DataFrame for easy viewing\n",
    "aggregates_df = pd.DataFrame(aggregates)\n",
    "aggregates_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "f7af11da",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_reaction_type_mixed.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_target_metrics_reaction_type_mixed.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_reaction_type(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_reaction_type_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided towards a given reaction type.',\n",
    "    highlight_per_group=False\n",
    ")\n",
    "\n",
    "# _ = get_search_taret_metrics_table_reaction_type(\n",
    "#     experiment_info, \n",
    "#     aggregates,\n",
    "#     table_name='search_target_metrics_reaction_type_mixed.tex',\n",
    "#     save_table=True,\n",
    "#     caption='Quality of routes generated by search methods on USPTO-190 guided towards a given reaction type.'\n",
    "# )\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_target_metrics_reaction_type_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided towards a given reaction type.',\n",
    "    highlight_per_group=False\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6740f70b",
   "metadata": {},
   "source": [
    "# Get latex tables for tanimoto experiments"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "7a99ecb4",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Example usage\n",
    "dataset = 'uspto190'\n",
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "neuralsym = 'NeuralSym'\n",
    "rsmiles = 'Rsmiles'\n",
    "rsmilestg = 'Rsmiles-T'\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934',\n",
    "        'method_name': 'NeuralSym-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711',\n",
    "        'method_name': 'NeuralSym-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     'experiment_regex': r'',\n",
    "    #     'method_name': 'NeuralSym-G',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\checkmark$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': neuralsym,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        'experiment_regex': r'neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718',\n",
    "        'method_name': 'NeuralSym-FG',\n",
    "        'experiment_group': 'search/retro_star', # empty if at top level\n",
    "        'category': '$\\checkmark$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': neuralsym,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229',\n",
    "        'method_name': 'Rsmiles-unguided',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040',\n",
    "        'method_name': 'Rsmiles-F',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "    #     'experiment_regex': r'rootaligned_reaction_type_steeredfalse_filteredfalse_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251113_174320',\n",
    "    #     'method_name': 'Rsmiles-G',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\\\times$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': rsmiles,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance20_length10_numModelCalls100_uspto_hard_20251116_144032',\n",
    "        'method_name': 'Rsmiles-FG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmiles,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "    # {\n",
    "    #     #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "    #     'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredfalse_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251113_161033',\n",
    "    #     'method_name': 'Rsmiles-token-guided',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\\\times$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': rsmilestg,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    # {\n",
    "    #     #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "    #     'experiment_regex': r'rootaligned_reaction_type_steeredtrue_filteredtrue_guidedfalse_guidance0.3_length15_numModelCalls100_uspto_hard_20251116_144248',\n",
    "    #     'method_name': 'Rsmiles-TF',\n",
    "    #     'experiment_group': 'search/retro_star',\n",
    "    #     'category': '$\\\\times$',\n",
    "    #     'criteria': 'reaction_type',\n",
    "    #     'trained_on': rsmilestg,\n",
    "    #     'combination': 'filter',\n",
    "    # },\n",
    "    {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115',\n",
    "        #'experiment_regex': r'steeredtrue_filteredfalse_guidedtrue_guidance0.3_minLength15_numModelCalls100_uspto_hard_\\d+',\n",
    "        'method_name': 'Rsmiles-TG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    },\n",
    "        {\n",
    "        #'experiment_regex': r'rootaligned_rsmiles_uspto_190_fraction1.0_thresh500_dropped_PtoR_aug5_steeredtrue_filteredfalse_guidedtrue_numModelCalls100_uspto_hard_20251112_181942',\n",
    "        'experiment_regex': r'rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109',\n",
    "        'method_name': 'Rsmiles-TFG',\n",
    "        'experiment_group': 'search/retro_star',\n",
    "        'category': '$\\\\times$',\n",
    "        'criteria': 'reaction_type',\n",
    "        'trained_on': rsmilestg,\n",
    "        'combination': 'filter',\n",
    "    }\n",
    "]\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "e0e23300",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934']\n",
      "Loading results for neuralsym_no_guidance_steeredfalse_filteredfalse_guidedfalse_numModelCalls100_uspto_hard_20251103_145934\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251121_062711\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718']\n",
      "Loading results for neuralsym_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance0_length0_numModelCalls100_uspto_hard_20251121_062718\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229']\n",
      "Loading results for rootaligned_no_guidance_steeredfalse_filteredfalse_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251119_122229\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedfalse_guidance0_length0_numModelCalls100_uspto_hard_20251116_144040\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance20_length10_numModelCalls100_uspto_hard_20251116_144032']\n",
      "Loading results for rootaligned_max_tanimoto_steeredfalse_filteredtrue_guidedtrue_guidance20_length10_numModelCalls100_uspto_hard_20251116_144032\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredfalse_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_002115\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "Loading from ['rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109']\n",
      "Loading results for rootaligned_max_tanimoto_steeredtrue_filteredtrue_guidedtrue_guidance20_length5_numModelCalls100_uspto_hard_20251116_144109\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_targets</th>\n",
       "      <th>solved_targets</th>\n",
       "      <th>solve_rate</th>\n",
       "      <th>solve_rate_with_sm</th>\n",
       "      <th>solved_targets_indices</th>\n",
       "      <th>solved_with_sm_indices</th>\n",
       "      <th>avg_nodes_explored</th>\n",
       "      <th>avg_model_calls</th>\n",
       "      <th>avg_time_taken</th>\n",
       "      <th>avg_routes_per_target</th>\n",
       "      <th>...</th>\n",
       "      <th>target_avg_contains_starting_material</th>\n",
       "      <th>num_routes_with_sm</th>\n",
       "      <th>avg_targets_with_exact_match_route</th>\n",
       "      <th>avg_targets_with_round_trip_route</th>\n",
       "      <th>avg_targets_with_rxn_name_match_route</th>\n",
       "      <th>avg_predicted_route_length</th>\n",
       "      <th>avg_true_route_length</th>\n",
       "      <th>avg_route_length_diff</th>\n",
       "      <th>avg_targets_with_exact_length_match</th>\n",
       "      <th>method</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>190</td>\n",
       "      <td>90</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>[2, 3, 4, 5, 8, 15, 16, 20, 25, 28, 30, 31, 32...</td>\n",
       "      <td>[2, 16, 20, 35, 41, 53, 56, 58, 59, 70, 72, 73...</td>\n",
       "      <td>17622.489474</td>\n",
       "      <td>87.963158</td>\n",
       "      <td>28.442381</td>\n",
       "      <td>1.357895</td>\n",
       "      <td>...</td>\n",
       "      <td>0.163158</td>\n",
       "      <td>0.127500</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.105263</td>\n",
       "      <td>0.042105</td>\n",
       "      <td>6.239537</td>\n",
       "      <td>5.900000</td>\n",
       "      <td>1.811019</td>\n",
       "      <td>0.126316</td>\n",
       "      <td>NeuralSym-unguided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>190</td>\n",
       "      <td>7</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>[10, 30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>[30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>300.521053</td>\n",
       "      <td>4.089474</td>\n",
       "      <td>33.912700</td>\n",
       "      <td>2.726316</td>\n",
       "      <td>...</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>0.010782</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>5.577631</td>\n",
       "      <td>3.428571</td>\n",
       "      <td>2.819010</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>NeuralSym-F</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>190</td>\n",
       "      <td>7</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>[10, 30, 108, 129, 154, 162, 163]</td>\n",
       "      <td>[30, 108, 129, 162]</td>\n",
       "      <td>323.584211</td>\n",
       "      <td>3.636842</td>\n",
       "      <td>33.821877</td>\n",
       "      <td>2.847368</td>\n",
       "      <td>...</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.009968</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>5.752866</td>\n",
       "      <td>3.428571</td>\n",
       "      <td>2.371913</td>\n",
       "      <td>0.031579</td>\n",
       "      <td>NeuralSym-FG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>190</td>\n",
       "      <td>153</td>\n",
       "      <td>0.805263</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...</td>\n",
       "      <td>[3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...</td>\n",
       "      <td>1071.631579</td>\n",
       "      <td>9.136842</td>\n",
       "      <td>630.115272</td>\n",
       "      <td>15.563158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.083437</td>\n",
       "      <td>0.005263</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>3.112590</td>\n",
       "      <td>6.516340</td>\n",
       "      <td>3.704284</td>\n",
       "      <td>0.221053</td>\n",
       "      <td>Rsmiles-unguided</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>190</td>\n",
       "      <td>38</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.184211</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 42, 47, 54, 55, 77...</td>\n",
       "      <td>125.436842</td>\n",
       "      <td>1.994737</td>\n",
       "      <td>148.235908</td>\n",
       "      <td>8.063158</td>\n",
       "      <td>...</td>\n",
       "      <td>0.184211</td>\n",
       "      <td>0.125197</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>0.026316</td>\n",
       "      <td>0.010526</td>\n",
       "      <td>2.134782</td>\n",
       "      <td>4.236842</td>\n",
       "      <td>2.502016</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>Rsmiles-F</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>190</td>\n",
       "      <td>38</td>\n",
       "      <td>0.200000</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...</td>\n",
       "      <td>[2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...</td>\n",
       "      <td>131.742105</td>\n",
       "      <td>1.936842</td>\n",
       "      <td>148.605978</td>\n",
       "      <td>8.568421</td>\n",
       "      <td>...</td>\n",
       "      <td>0.194737</td>\n",
       "      <td>0.126603</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>0.026316</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>2.285888</td>\n",
       "      <td>4.236842</td>\n",
       "      <td>2.359069</td>\n",
       "      <td>0.073684</td>\n",
       "      <td>Rsmiles-FG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>190</td>\n",
       "      <td>161</td>\n",
       "      <td>0.847368</td>\n",
       "      <td>0.631579</td>\n",
       "      <td>[0, 1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14...</td>\n",
       "      <td>[0, 1, 2, 3, 4, 9, 10, 11, 12, 13, 14, 15, 16,...</td>\n",
       "      <td>1880.047368</td>\n",
       "      <td>6.884211</td>\n",
       "      <td>640.200369</td>\n",
       "      <td>66.842105</td>\n",
       "      <td>...</td>\n",
       "      <td>0.631579</td>\n",
       "      <td>0.320232</td>\n",
       "      <td>0.021053</td>\n",
       "      <td>0.089474</td>\n",
       "      <td>0.073684</td>\n",
       "      <td>2.826685</td>\n",
       "      <td>5.627329</td>\n",
       "      <td>2.942743</td>\n",
       "      <td>0.284211</td>\n",
       "      <td>Rsmiles-TG</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>190</td>\n",
       "      <td>35</td>\n",
       "      <td>0.184211</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>[2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 70...</td>\n",
       "      <td>[2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 77...</td>\n",
       "      <td>126.657895</td>\n",
       "      <td>1.731579</td>\n",
       "      <td>163.408728</td>\n",
       "      <td>7.321053</td>\n",
       "      <td>...</td>\n",
       "      <td>0.173684</td>\n",
       "      <td>0.118839</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>0.036842</td>\n",
       "      <td>0.015789</td>\n",
       "      <td>1.989789</td>\n",
       "      <td>3.885714</td>\n",
       "      <td>2.200719</td>\n",
       "      <td>0.063158</td>\n",
       "      <td>Rsmiles-TFG</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>8 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "   total_targets  solved_targets  solve_rate  solve_rate_with_sm  \\\n",
       "0            190              90    0.473684            0.163158   \n",
       "1            190               7    0.036842            0.031579   \n",
       "2            190               7    0.036842            0.021053   \n",
       "3            190             153    0.805263            0.173684   \n",
       "4            190              38    0.200000            0.184211   \n",
       "5            190              38    0.200000            0.194737   \n",
       "6            190             161    0.847368            0.631579   \n",
       "7            190              35    0.184211            0.173684   \n",
       "\n",
       "                              solved_targets_indices  \\\n",
       "0  [2, 3, 4, 5, 8, 15, 16, 20, 25, 28, 30, 31, 32...   \n",
       "1                  [10, 30, 108, 129, 154, 162, 163]   \n",
       "2                  [10, 30, 108, 129, 154, 162, 163]   \n",
       "3  [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,...   \n",
       "4  [2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...   \n",
       "5  [2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...   \n",
       "6  [0, 1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14...   \n",
       "7  [2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 70...   \n",
       "\n",
       "                              solved_with_sm_indices  avg_nodes_explored  \\\n",
       "0  [2, 16, 20, 35, 41, 53, 56, 58, 59, 70, 72, 73...        17622.489474   \n",
       "1                      [30, 108, 129, 154, 162, 163]          300.521053   \n",
       "2                                [30, 108, 129, 162]          323.584211   \n",
       "3  [3, 11, 13, 14, 16, 35, 36, 38, 50, 51, 53, 70...         1071.631579   \n",
       "4  [2, 10, 11, 13, 16, 26, 29, 42, 47, 54, 55, 77...          125.436842   \n",
       "5  [2, 10, 11, 13, 16, 26, 29, 30, 42, 47, 54, 55...          131.742105   \n",
       "6  [0, 1, 2, 3, 4, 9, 10, 11, 12, 13, 14, 15, 16,...         1880.047368   \n",
       "7  [2, 10, 11, 13, 16, 22, 26, 29, 30, 42, 55, 77...          126.657895   \n",
       "\n",
       "   avg_model_calls  avg_time_taken  avg_routes_per_target  ...  \\\n",
       "0        87.963158       28.442381               1.357895  ...   \n",
       "1         4.089474       33.912700               2.726316  ...   \n",
       "2         3.636842       33.821877               2.847368  ...   \n",
       "3         9.136842      630.115272              15.563158  ...   \n",
       "4         1.994737      148.235908               8.063158  ...   \n",
       "5         1.936842      148.605978               8.568421  ...   \n",
       "6         6.884211      640.200369              66.842105  ...   \n",
       "7         1.731579      163.408728               7.321053  ...   \n",
       "\n",
       "   target_avg_contains_starting_material  num_routes_with_sm  \\\n",
       "0                               0.163158            0.127500   \n",
       "1                               0.031579            0.010782   \n",
       "2                               0.021053            0.009968   \n",
       "3                               0.173684            0.083437   \n",
       "4                               0.184211            0.125197   \n",
       "5                               0.194737            0.126603   \n",
       "6                               0.631579            0.320232   \n",
       "7                               0.173684            0.118839   \n",
       "\n",
       "   avg_targets_with_exact_match_route  avg_targets_with_round_trip_route  \\\n",
       "0                            0.010526                           0.105263   \n",
       "1                            0.005263                           0.010526   \n",
       "2                            0.005263                           0.010526   \n",
       "3                            0.005263                           0.089474   \n",
       "4                            0.010526                           0.026316   \n",
       "5                            0.015789                           0.026316   \n",
       "6                            0.021053                           0.089474   \n",
       "7                            0.015789                           0.036842   \n",
       "\n",
       "   avg_targets_with_rxn_name_match_route  avg_predicted_route_length  \\\n",
       "0                               0.042105                    6.239537   \n",
       "1                               0.010526                    5.577631   \n",
       "2                               0.010526                    5.752866   \n",
       "3                               0.100000                    3.112590   \n",
       "4                               0.010526                    2.134782   \n",
       "5                               0.015789                    2.285888   \n",
       "6                               0.073684                    2.826685   \n",
       "7                               0.015789                    1.989789   \n",
       "\n",
       "   avg_true_route_length  avg_route_length_diff  \\\n",
       "0               5.900000               1.811019   \n",
       "1               3.428571               2.819010   \n",
       "2               3.428571               2.371913   \n",
       "3               6.516340               3.704284   \n",
       "4               4.236842               2.502016   \n",
       "5               4.236842               2.359069   \n",
       "6               5.627329               2.942743   \n",
       "7               3.885714               2.200719   \n",
       "\n",
       "   avg_targets_with_exact_length_match              method  \n",
       "0                             0.126316  NeuralSym-unguided  \n",
       "1                             0.031579         NeuralSym-F  \n",
       "2                             0.031579        NeuralSym-FG  \n",
       "3                             0.221053    Rsmiles-unguided  \n",
       "4                             0.063158           Rsmiles-F  \n",
       "5                             0.073684          Rsmiles-FG  \n",
       "6                             0.284211          Rsmiles-TG  \n",
       "7                             0.063158         Rsmiles-TFG  \n",
       "\n",
       "[8 rows x 33 columns]"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates = aggregate_guided_search_results_with_selection(\n",
    "    experiment_info=experiment_info,\n",
    "    project_root=PROJECT_ROOT,\n",
    "    experiment_dir='experiments',\n",
    "    selection_criteria='tanimoto'\n",
    ")\n",
    "\n",
    "# Convert to DataFrame for easy viewing\n",
    "aggregates_df = pd.DataFrame(aggregates)\n",
    "\n",
    "aggregates_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "6ad2562d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['total_targets', 'solved_targets', 'solve_rate', 'solve_rate_with_sm',\n",
       "       'solved_targets_indices', 'solved_with_sm_indices',\n",
       "       'avg_nodes_explored', 'avg_model_calls', 'avg_time_taken',\n",
       "       'avg_routes_per_target', 'avg_num_nonoverlapping_routes',\n",
       "       'dataset_avg_exact_match', 'dataset_avg_round_trip',\n",
       "       'dataset_avg_rxn_type_match', 'dataset_avg_tanimoto_to_target',\n",
       "       'dataset_avg_tanimoto_to_sm', 'dataset_avg_rxn_name_match',\n",
       "       'target_avg_exact_match', 'target_avg_round_trip',\n",
       "       'target_avg_rxn_type_match', 'target_avg_tanimoto_to_target',\n",
       "       'target_avg_tanimoto_to_sm', 'target_avg_rxn_name_match',\n",
       "       'target_avg_contains_starting_material', 'num_routes_with_sm',\n",
       "       'avg_targets_with_exact_match_route',\n",
       "       'avg_targets_with_round_trip_route', 'avg_predicted_route_length',\n",
       "       'avg_true_route_length', 'avg_route_length_diff',\n",
       "       'avg_targets_with_exact_length_match', 'method'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates_df.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "9104f482",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_metrics_tanimoto_mixed.tex\n",
      "LaTeX table saved to: /Users/laabidn1/multiguide/paper/iclr2026/tables/search_target_metrics_tanimoto_mixed.tex\n"
     ]
    }
   ],
   "source": [
    "_ = get_search_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates, \n",
    "    table_name='search_metrics_tanimoto_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Search metrics on USPTO-190 guided towards a specific starting material.',\n",
    "    highlight_per_group=False\n",
    ")\n",
    "\n",
    "_ = get_search_target_metrics_table_tanimoto(\n",
    "    experiment_info, \n",
    "    aggregates,\n",
    "    table_name='search_target_metrics_tanimoto_mixed.tex',\n",
    "    save_table=True,\n",
    "    caption='Quality of routes generated by search methods on USPTO-190 guided towards a specific starting material.',\n",
    "    highlight_per_group=False\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2aa2ff51",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "syntheseus-in-python10",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
