{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "13231426",
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "id": "9362000d",
   "metadata": {},
   "outputs": [],
   "source": [
    "#from multiguide.evaluation.helpers import extract_reactions\n",
    "import pandas as pd\n",
    "import json\n",
    "import os\n",
    "\n",
    "from multiguide.helpers import PROJECT_ROOT\n",
    "from multiguide.evaluation.helpers import load_experiment_results, select_best_experiment_per_product, _calculate_per_experiment_metrics\n",
    "from multiguide.evaluation.helpers import simplify_metrics, calculate_route_completion_rates, jaccard_similarity"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "9ffe86d7",
   "metadata": {},
   "source": [
    "# Latex table for reaction type guidance"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "id": "e764808d",
   "metadata": {},
   "outputs": [],
   "source": [
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "\n",
    "# Example usage\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'route_similarity_data_routes190_seed42_modelrootaligned_steeredfalse_guidance0.0_length0_results100_candidates53_time20251117_142029',\n",
    "        'method_name': 'Rsmiles',\n",
    "        'experiment_group': 'no_guidance',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance\\d+\\.?\\d*_length\\d+_results100_candidates53_time\\d+',\n",
    "        'method_name': 'Rsmiles',\n",
    "        'experiment_group': 'reaction_type',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 71,
   "id": "00daa967",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredfalse_guidance0.0_length0_results100_candidates53_time20251117_142029 from /Users/laabidn1/multiguide/experiments/manual_synthesis/no_guidance\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance0.3_length15_results100_candidates53_time20251117_142008 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance1.5_length10_results100_candidates53_time20251117_153015 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance3.0_length15_results100_candidates53_time20251117_164133 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance5.0_length10_results100_candidates53_time20251117_165103 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance3.0_length10_results100_candidates53_time20251117_162201 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance0.5_length15_results100_candidates53_time20251117_125709 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance1.5_length15_results100_candidates53_time20251117_143641 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n"
     ]
    }
   ],
   "source": [
    "aggregates = []\n",
    "for exp in experiment_info:\n",
    "    experiment_regex = exp['experiment_regex']\n",
    "    method_name = exp['method_name']\n",
    "    experiment_group = exp['experiment_group']\n",
    "    experiment_filters = {'experiment_regex': experiment_regex}\n",
    "    results = load_experiment_results(PROJECT_ROOT, experiment_dir, experiment_group, experiment_filters)\n",
    "    guided_data, guided_experiments = select_best_experiment_per_product(\n",
    "        list_dfs=results.values(), \n",
    "        list_experiment_names=results.keys()\n",
    "    )\n",
    "    guided_quality_metrics = _calculate_per_experiment_metrics(guided_data)\n",
    "    guided_quality_metrics = simplify_metrics(guided_quality_metrics)\n",
    "    true_routes_path = 'route_similarity_data/processed/Strychnine_routes.json'\n",
    "    full_true_routes_path = os.path.join(PROJECT_ROOT, 'data', true_routes_path)\n",
    "    with open(full_true_routes_path, 'r') as f:\n",
    "        true_routes = json.load(f)\n",
    "    route_completion = calculate_route_completion_rates(\n",
    "        results, true_routes, use_starting_material=False, max_steps=100\n",
    "    )\n",
    "    guided_quality_metrics['completion_rate'] = route_completion['mixed_param_completion']['completion_rate']\n",
    "    guided_quality_metrics['method'] = method_name\n",
    "    guided_quality_metrics['route_completion'] = route_completion\n",
    "    aggregates.append(guided_quality_metrics)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 72,
   "id": "0841ffd4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "0\n",
      "setps_solved 7/16\n",
      "setps_solved 9/21\n",
      "setps_solved 3/17\n",
      "setps_solved 3/16\n",
      "setps_solved 8/14\n",
      "setps_solved 9/18\n",
      "setps_solved 1/9\n",
      "setps_solved 2/12\n",
      "setps_solved 5/16\n",
      "setps_solved 2/12\n",
      "setps_solved 7/14\n",
      "setps_solved 11/26\n",
      "----------------------------------------------------------------------------------------------------\n",
      "1\n",
      "setps_solved 7/16\n",
      "setps_solved 9/21\n",
      "setps_solved 4/17\n",
      "setps_solved 3/16\n",
      "setps_solved 8/14\n",
      "setps_solved 11/18\n",
      "setps_solved 1/9\n",
      "setps_solved 3/12\n",
      "setps_solved 5/16\n",
      "setps_solved 2/12\n",
      "setps_solved 7/14\n",
      "setps_solved 11/26\n"
     ]
    }
   ],
   "source": [
    "for agg_idx in range(len(aggregates)):\n",
    "    print('-'*100)\n",
    "    print(f'{agg_idx}')\n",
    "    route_details = aggregates[agg_idx]['route_completion']['mixed_param_completion']['route_details']\n",
    "    for route_info in route_details:\n",
    "        print(f'setps_solved {route_info[\"steps_solved\"]}/{route_info[\"total_steps\"]}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 73,
   "id": "8023fb0f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "0\n",
      "----------------------------------------------------------------------------------------------------\n",
      "1\n",
      "steps_solved_by_agg1_not_agg0: [(2, 7), (2, 16), (5, 14), (5, 16), (7, 8)]\n",
      "steps_solved_by_agg0_not_agg1: [(2, 12)]\n"
     ]
    }
   ],
   "source": [
    "results_per_agg = {\n",
    "}\n",
    "for agg_idx in range(len(aggregates)):\n",
    "    results_per_agg[agg_idx] = {\n",
    "        'steps_solved': [],\n",
    "    }\n",
    "    print('-'*100)\n",
    "    print(f'{agg_idx}')\n",
    "    route_details = aggregates[agg_idx]['route_completion']['mixed_param_completion']['route_details']\n",
    "    for route_idx, route_info in enumerate(route_details):\n",
    "        for step_idx, step_result in enumerate(route_info['step_results']):\n",
    "            if step_result['solved']:\n",
    "                results_per_agg[agg_idx]['steps_solved'].append((route_idx, step_idx))\n",
    "\n",
    "# find steps solved by agg 1 and not agg 0\n",
    "steps_solved_by_agg1_not_agg0 = [step for step in results_per_agg[1]['steps_solved'] if step not in results_per_agg[0]['steps_solved']]\n",
    "steps_solved_by_agg0_not_agg1 = [step for step in results_per_agg[0]['steps_solved'] if step not in results_per_agg[1]['steps_solved']]\n",
    "print(f'steps_solved_by_agg1_not_agg0: {steps_solved_by_agg1_not_agg0}')\n",
    "print(f'steps_solved_by_agg0_not_agg1: {steps_solved_by_agg0_not_agg1}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "id": "08d20057",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "0\n",
      "completion_rate: 0.0\n",
      "perc_samples_per_product: 0.7238095238095238\n",
      "percentage_products_with_exact_match: 0.8095238095238095\n",
      "percentage_products_with_class_correct: 1.0\n",
      "perc_class_correct_samples_per_product: 0.2333333333333333\n",
      "percentage_products_with_rxn_name_correct: 1.0\n",
      "avg_rxn_name_correct_samples_per_product: 11.333333333333334\n",
      "percentage_products_with_round_trip_correct: 0.9047619047619048\n",
      "perc_round_trip_correct_samples_per_product: 0.06210526315789473\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "1\n",
      "completion_rate: 0.0\n",
      "perc_samples_per_product: 0.7757142857142857\n",
      "percentage_products_with_exact_match: 0.8095238095238095\n",
      "percentage_products_with_class_correct: 1.0\n",
      "perc_class_correct_samples_per_product: 0.26\n",
      "percentage_products_with_rxn_name_correct: 1.0\n",
      "avg_rxn_name_correct_samples_per_product: 12.19047619047619\n",
      "percentage_products_with_round_trip_correct: 0.9047619047619048\n",
      "perc_round_trip_correct_samples_per_product: 0.0668421052631579\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    }
   ],
   "source": [
    "\n",
    "\n",
    "# perc_samples_per_product\n",
    "# percentage_products_with_exact_match\n",
    "# percentage_products_with_class_correct\n",
    "# perc_class_correct_samples_per_product\n",
    "# percentage_products_with_rxn_name_correct\n",
    "# avg_rxn_name_correct_samples_per_product\n",
    "keys = ['completion_rate', 'perc_samples_per_product', \n",
    "'percentage_products_with_exact_match', 'percentage_products_with_class_correct', \n",
    "'perc_class_correct_samples_per_product', 'percentage_products_with_rxn_name_correct', \n",
    "'avg_rxn_name_correct_samples_per_product', 'percentage_products_with_round_trip_correct',\n",
    "'perc_round_trip_correct_samples_per_product']\n",
    "\n",
    "for agg_idx in range(len(aggregates)):\n",
    "    print('-'*100)\n",
    "    print(f'{agg_idx}')\n",
    "    for key in keys:\n",
    "        print(f'{key}: {aggregates[agg_idx][key]}')\n",
    "    print('-'*100)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "7f0fa640",
   "metadata": {},
   "source": [
    "# Astro..."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "id": "a460dc4d",
   "metadata": {},
   "outputs": [],
   "source": [
    "experiment_dir = 'experiments/manual_synthesis'\n",
    "true_routes_path = 'route_similarity_data/processed/Atorvastatin_routes.json'\n",
    "\n",
    "# Example usage\n",
    "experiment_info = [\n",
    "    {\n",
    "        'experiment_regex': r'Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056',\n",
    "        'method_name': 'Rsmiles',\n",
    "        'experiment_group': 'no_guidance',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "    {\n",
    "        'experiment_regex': r'Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredtrue_guidance\\d+\\.?\\d*_length\\d+_results100_candidates53_time\\d+',\n",
    "        'method_name': 'Rsmiles',\n",
    "        'experiment_group': 'reaction_type',\n",
    "        'category': 'N.T.'\n",
    "    },\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "id": "fb4d444b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading results for Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056 from /Users/laabidn1/multiguide/experiments/manual_synthesis/no_guidance\n",
      "Loading results for Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredtrue_guidance5.0_length10_results100_candidates53_time20251117_175437 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredtrue_guidance1.5_length15_results100_candidates53_time20251117_175843 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n",
      "Loading results for Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredtrue_guidance0.5_length10_results100_candidates53_time20251117_175945 from /Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type\n"
     ]
    }
   ],
   "source": [
    "aggregates = []\n",
    "all_guided_data = []\n",
    "for exp in experiment_info:\n",
    "    experiment_regex = exp['experiment_regex']\n",
    "    method_name = exp['method_name']\n",
    "    experiment_group = exp['experiment_group']\n",
    "    experiment_filters = {'experiment_regex': experiment_regex}\n",
    "    results = load_experiment_results(PROJECT_ROOT, experiment_dir, experiment_group, experiment_filters)\n",
    "    guided_data, guided_experiments = select_best_experiment_per_product(\n",
    "        list_dfs=results.values(), \n",
    "        list_experiment_names=results.keys()\n",
    "    )\n",
    "    all_guided_data.append(guided_data)\n",
    "    guided_quality_metrics = _calculate_per_experiment_metrics(guided_data)\n",
    "    guided_quality_metrics = simplify_metrics(guided_quality_metrics)\n",
    "    full_true_routes_path = os.path.join(PROJECT_ROOT, 'data', true_routes_path)\n",
    "    with open(full_true_routes_path, 'r') as f:\n",
    "        true_routes = json.load(f)\n",
    "    route_completion = calculate_route_completion_rates(\n",
    "        results, true_routes, use_starting_material=False, max_steps=100\n",
    "    )\n",
    "    guided_quality_metrics['completion_rate'] = route_completion['mixed_param_completion']['completion_rate']\n",
    "    guided_quality_metrics['method'] = method_name\n",
    "    guided_quality_metrics['route_completion'] = route_completion\n",
    "    aggregates.append(guided_quality_metrics)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "id": "6295d054",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['product_smi', 'true_reactants', 'true_class',\n",
       "       'true_most_similar_reactants_similarity',\n",
       "       'true_least_similar_reactants_similarity',\n",
       "       'true_most_similar_reactants', 'true_least_similar_reactants',\n",
       "       'true_similarity_to_target', 'conditional_starting_material',\n",
       "       'conditional_target', 'original_target', 'original_starting_material',\n",
       "       'reactant_predictions', 'product_idx', 'sample_index',\n",
       "       'all_pred_reactants_are_bbs', 'pred_tanimoto_to_target',\n",
       "       'pred_tanimoto_to_starting_material', 'topk', 'classifier_output',\n",
       "       'classifier_confidence', 'round_trip_results', 'round_trip_accuracy',\n",
       "       'rxn_insight_info', 'rxn_insight_NAME', 'pred_class',\n",
       "       'experiment_name'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 93,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "guided_data.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "id": "4daf0c90",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(18, 21)"
      ]
     },
     "execution_count": 109,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "smi = 'CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1'\n",
    "smi = 'CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1'\n",
    "#smi = 'COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C'\n",
    "g_data = all_guided_data[0]\n",
    "g_data[g_data['product_smi'] == smi]['true_reactants'].value_counts()\n",
    "predictions_0 = g_data[g_data['product_smi'] == smi]['reactant_predictions'].unique().tolist()\n",
    "g_data_1 = all_guided_data[1]\n",
    "predictions_1 = g_data_1[g_data_1['product_smi'] == smi]['reactant_predictions'].unique().tolist()\n",
    "# CCC(C)C(=O)C(=Cc1ccccc1)C(=O)Nc1ccccc1.O=Cc1ccc(F)cc1\n",
    "#jaccard_similarity(predictions_0, predictions_1)\n",
    "predictions_0\n",
    "#CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CO[Na]\n",
    "s = 'CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1'\n",
    "s = 'O=Cc1ccc(F)cc1'\n",
    "sum([s in p for p in predictions_0]), sum([s in p for p in predictions_1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "id": "fd1e34fa",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[{'route_idx': 0,\n",
       "  'main_target': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O',\n",
       "  'total_steps': 12,\n",
       "  'steps_solved': 9,\n",
       "  'step_results': [{'reaction_idx': 0,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1.O',\n",
       "    'true_distance_to_starting_material': 0.970626631853786,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [122],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2109324758842443],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.9900265957446808],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.6096151958316455],\n",
       "    'true_tanimoto_to_starting_material': [0.970626631853786],\n",
       "    'avg_true_class_matches': [0.13114754098360656]},\n",
       "   {'reaction_idx': 1,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)CC(=O)OC(C)(C)C',\n",
       "    'true_distance_to_starting_material': 0.9686274509803922,\n",
       "    'solved': False,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [169],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2469841269841269],\n",
       "    'max_pred_tanimoto_to_starting_material': [1.0],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.7859454271854459],\n",
       "    'true_tanimoto_to_starting_material': [0.9686274509803922],\n",
       "    'avg_true_class_matches': [0.047337278106508875]},\n",
       "   {'reaction_idx': 2,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)CC(=O)OC(C)(C)C',\n",
       "    'true_reactants': 'CC(=O)OC(C)(C)C.COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C',\n",
       "    'true_distance_to_starting_material': 0.9946666666666667,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [51],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2676232064878353],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.9946666666666668],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.8472075570292343],\n",
       "    'true_tanimoto_to_starting_material': [0.9946666666666667],\n",
       "    'avg_true_class_matches': [0.6470588235294118]},\n",
       "   {'reaction_idx': 3,\n",
       "    'true_product': 'COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CO[Na]',\n",
       "    'true_distance_to_starting_material': 0.8987951807228916,\n",
       "    'solved': False,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [70],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1892764857881137],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.9933020763563296],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.6642234562738322],\n",
       "    'true_tanimoto_to_starting_material': [0.8987951807228916],\n",
       "    'avg_true_class_matches': [0.05714285714285714]},\n",
       "   {'reaction_idx': 4,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1',\n",
       "    'true_reactants': 'CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O',\n",
       "    'true_distance_to_starting_material': 0.8811400848999393,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [87],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.4198031268094962],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.9718402095612312],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.7595757587061699],\n",
       "    'true_tanimoto_to_starting_material': [0.8811400848999393],\n",
       "    'avg_true_class_matches': [0.2413793103448276]},\n",
       "   {'reaction_idx': 5,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1',\n",
       "    'true_distance_to_starting_material': 0.955862977602108,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [55],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2592592592592592],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.970509383378016],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.7252212186476554],\n",
       "    'true_tanimoto_to_starting_material': [0.955862977602108],\n",
       "    'avg_true_class_matches': [0.14545454545454545]},\n",
       "   {'reaction_idx': 6,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1',\n",
       "    'true_reactants': 'CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1.O=C(C#Cc1ccccc1)Nc1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.36988737403675165,\n",
       "    'solved': False,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [64],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1727447216890595],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.96],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.4166325451879309],\n",
       "    'true_tanimoto_to_starting_material': [0.36988737403675165],\n",
       "    'avg_true_class_matches': [0.6875]},\n",
       "   {'reaction_idx': 7,\n",
       "    'true_product': 'CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1',\n",
       "    'true_reactants': 'CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C',\n",
       "    'true_distance_to_starting_material': 0.33114949374627756,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [54],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1057441253263707],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3847045191193511],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.19357957031477732],\n",
       "    'true_tanimoto_to_starting_material': [0.33114949374627756],\n",
       "    'avg_true_class_matches': [0.1111111111111111]},\n",
       "   {'reaction_idx': 8,\n",
       "    'true_product': 'O=C(C#Cc1ccccc1)Nc1ccccc1',\n",
       "    'true_reactants': 'Nc1ccccc1.O=C(O)C#Cc1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.0862977602108037,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [40],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.050632911392405],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3347381095725467],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.12395719616426167],\n",
       "    'true_tanimoto_to_starting_material': [0.0862977602108037],\n",
       "    'avg_true_class_matches': [0.625]},\n",
       "   {'reaction_idx': 9,\n",
       "    'true_product': 'CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C',\n",
       "    'true_reactants': 'CC(C)C(=O)Cl.CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1',\n",
       "    'true_distance_to_starting_material': 0.24705152079453754,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [60],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1080729166666666],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3695014662756598],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.2181770207323178],\n",
       "    'true_tanimoto_to_starting_material': [0.24705152079453754],\n",
       "    'avg_true_class_matches': [0.5166666666666667]},\n",
       "   {'reaction_idx': 10,\n",
       "    'true_product': 'CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1',\n",
       "    'true_reactants': 'CCOC(=O)C(Br)c1ccc(F)cc1.NCCC1OCCO1',\n",
       "    'true_distance_to_starting_material': 0.1868622448979592,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [41],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.0988219895287958],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.2367447595561035],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.18406678657076592],\n",
       "    'true_tanimoto_to_starting_material': [0.1868622448979592],\n",
       "    'avg_true_class_matches': [0.8292682926829268]},\n",
       "   {'reaction_idx': 11,\n",
       "    'true_product': 'CCOC(=O)C(Br)c1ccc(F)cc1',\n",
       "    'true_reactants': 'CCOC(=O)Cc1ccc(F)cc1.O=C1CCC(=O)N1Br',\n",
       "    'true_distance_to_starting_material': 0.16162266580811332,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [40],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.0765676567656765],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.1741645244215938],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.13555026252497004],\n",
       "    'true_tanimoto_to_starting_material': [0.16162266580811332],\n",
       "    'avg_true_class_matches': [0.325]}]},\n",
       " {'route_idx': 1,\n",
       "  'main_target': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O',\n",
       "  'total_steps': 10,\n",
       "  'steps_solved': 8,\n",
       "  'step_results': [{'reaction_idx': 0,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1.O',\n",
       "    'true_distance_to_starting_material': 1.0,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [122],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2109324758842443],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.9900265957446808],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.6096151958316455],\n",
       "    'true_tanimoto_to_starting_material': [1.0],\n",
       "    'avg_true_class_matches': [0.13114754098360656]},\n",
       "   {'reaction_idx': 1,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1',\n",
       "    'true_reactants': 'COC(=O)CC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C',\n",
       "    'true_distance_to_starting_material': 0.9669046073977936,\n",
       "    'solved': False,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [169],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2469841269841269],\n",
       "    'max_pred_tanimoto_to_starting_material': [1.0],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.7859454271854459],\n",
       "    'true_tanimoto_to_starting_material': [0.9669046073977936],\n",
       "    'avg_true_class_matches': [0.047337278106508875]},\n",
       "   {'reaction_idx': 2,\n",
       "    'true_product': 'COC(=O)CC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O.COC(=O)CC(C)=O',\n",
       "    'true_distance_to_starting_material': 0.9427456083279115,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [85],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1693189051559516],\n",
       "    'max_pred_tanimoto_to_starting_material': [1.0],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.8448198384881935],\n",
       "    'true_tanimoto_to_starting_material': [0.9427456083279115],\n",
       "    'avg_true_class_matches': [0.5647058823529412]},\n",
       "   {'reaction_idx': 3,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1',\n",
       "    'true_distance_to_starting_material': 0.9455958549222798,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [55],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2592592592592592],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.970509383378016],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.7252212186476554],\n",
       "    'true_tanimoto_to_starting_material': [0.9455958549222798],\n",
       "    'avg_true_class_matches': [0.14545454545454545]},\n",
       "   {'reaction_idx': 4,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1',\n",
       "    'true_reactants': 'CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1.O=C(C#Cc1ccccc1)Nc1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.3719298245614035,\n",
       "    'solved': False,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [64],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1727447216890595],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.96],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.4166325451879309],\n",
       "    'true_tanimoto_to_starting_material': [0.3719298245614035],\n",
       "    'avg_true_class_matches': [0.6875]},\n",
       "   {'reaction_idx': 5,\n",
       "    'true_product': 'CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1',\n",
       "    'true_reactants': 'CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C',\n",
       "    'true_distance_to_starting_material': 0.3352941176470588,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [54],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1057441253263707],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3847045191193511],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.19357957031477732],\n",
       "    'true_tanimoto_to_starting_material': [0.3352941176470588],\n",
       "    'avg_true_class_matches': [0.1111111111111111]},\n",
       "   {'reaction_idx': 6,\n",
       "    'true_product': 'O=C(C#Cc1ccccc1)Nc1ccccc1',\n",
       "    'true_reactants': 'Nc1ccccc1.O=C(O)C#Cc1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.08575112830431979,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [40],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.050632911392405],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3347381095725467],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.12395719616426167],\n",
       "    'true_tanimoto_to_starting_material': [0.08575112830431979],\n",
       "    'avg_true_class_matches': [0.625]},\n",
       "   {'reaction_idx': 7,\n",
       "    'true_product': 'CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C',\n",
       "    'true_reactants': 'CC(C)C(=O)Cl.CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1',\n",
       "    'true_distance_to_starting_material': 0.24786324786324787,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [60],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1080729166666666],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3695014662756598],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.2181770207323178],\n",
       "    'true_tanimoto_to_starting_material': [0.24786324786324787],\n",
       "    'avg_true_class_matches': [0.5166666666666667]},\n",
       "   {'reaction_idx': 8,\n",
       "    'true_product': 'CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1',\n",
       "    'true_reactants': 'CCOC(=O)C(Br)c1ccc(F)cc1.NCCC1OCCO1',\n",
       "    'true_distance_to_starting_material': 0.18722604884157795,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [41],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.0988219895287958],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.2367447595561035],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.18406678657076592],\n",
       "    'true_tanimoto_to_starting_material': [0.18722604884157795],\n",
       "    'avg_true_class_matches': [0.8292682926829268]},\n",
       "   {'reaction_idx': 9,\n",
       "    'true_product': 'CCOC(=O)C(Br)c1ccc(F)cc1',\n",
       "    'true_reactants': 'CCOC(=O)Cc1ccc(F)cc1.O=C1CCC(=O)N1Br',\n",
       "    'true_distance_to_starting_material': 0.16318785578747627,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [40],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.0765676567656765],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.1741645244215938],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.13555026252497004],\n",
       "    'true_tanimoto_to_starting_material': [0.16318785578747627],\n",
       "    'avg_true_class_matches': [0.325]}]},\n",
       " {'route_idx': 2,\n",
       "  'main_target': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O',\n",
       "  'total_steps': 9,\n",
       "  'steps_solved': 8,\n",
       "  'step_results': [{'reaction_idx': 0,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1.O',\n",
       "    'true_distance_to_starting_material': 0.4117983963344788,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [122],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2109324758842443],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.9900265957446808],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.6096151958316455],\n",
       "    'true_tanimoto_to_starting_material': [0.4117983963344788],\n",
       "    'avg_true_class_matches': [0.13114754098360656]},\n",
       "   {'reaction_idx': 1,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1',\n",
       "    'true_reactants': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)OC(C)(C)O1',\n",
       "    'true_distance_to_starting_material': 0.4212309429700734,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [88],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.3786941580756013],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.8678881388621023],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.4523253956699987],\n",
       "    'true_tanimoto_to_starting_material': [0.4212309429700734],\n",
       "    'avg_true_class_matches': [0.03409090909090909]},\n",
       "   {'reaction_idx': 2,\n",
       "    'true_product': 'CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)OC(C)(C)O1',\n",
       "    'true_reactants': 'CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1.CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1',\n",
       "    'true_distance_to_starting_material': 0.8,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [True],\n",
       "    'num_samples': [100],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.3919952913478516],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.8],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.45017596911139585],\n",
       "    'true_tanimoto_to_starting_material': [0.8],\n",
       "    'avg_true_class_matches': [0.33]},\n",
       "   {'reaction_idx': 3,\n",
       "    'true_product': 'CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1',\n",
       "    'true_reactants': 'CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1.O=Cc1ccc(F)cc1',\n",
       "    'true_distance_to_starting_material': 0.37779850746268656,\n",
       "    'solved': False,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [83],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1507692307692307],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.7497656982193065],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.3427733286337904],\n",
       "    'true_tanimoto_to_starting_material': [0.37779850746268656],\n",
       "    'avg_true_class_matches': [0.6385542168674698]},\n",
       "   {'reaction_idx': 4,\n",
       "    'true_product': 'CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1',\n",
       "    'true_reactants': 'CC1(C)O[C@H](CC#N)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1',\n",
       "    'true_distance_to_starting_material': 0.3023457862728063,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [58],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.2024367385192127],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.4008163265306122],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.29759306424646337],\n",
       "    'true_tanimoto_to_starting_material': [0.3023457862728063],\n",
       "    'avg_true_class_matches': [0.3275862068965517]},\n",
       "   {'reaction_idx': 5,\n",
       "    'true_product': 'CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1',\n",
       "    'true_reactants': 'CC(C)C(=O)CC(=O)Nc1ccccc1.O=Cc1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.3055555555555556,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [76],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1266375545851528],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.42846094354215],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.24676698568583055],\n",
       "    'true_tanimoto_to_starting_material': [0.3055555555555556],\n",
       "    'avg_true_class_matches': [0.3026315789473684]},\n",
       "   {'reaction_idx': 6,\n",
       "    'true_product': 'CC1(C)O[C@H](CC#N)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1',\n",
       "    'true_reactants': 'COC(C)(C)OC.N#CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.2695570216776626,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [55],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1778618732261116],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.4148329258353708],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.28836786872502584],\n",
       "    'true_tanimoto_to_starting_material': [0.2695570216776626],\n",
       "    'avg_true_class_matches': [0.43636363636363634]},\n",
       "   {'reaction_idx': 7,\n",
       "    'true_product': 'N#CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1',\n",
       "    'true_reactants': 'N#CC[C@@H](O)CC(=O)CC(=O)N(c1ccccc1)c1ccccc1',\n",
       "    'true_distance_to_starting_material': 0.29902912621359223,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [57],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.0961945031712473],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3008595988538682],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.23287375701916616],\n",
       "    'true_tanimoto_to_starting_material': [0.29902912621359223],\n",
       "    'avg_true_class_matches': [0.12280701754385964]},\n",
       "   {'reaction_idx': 8,\n",
       "    'true_product': 'N#CC[C@@H](O)CC(=O)CC(=O)N(c1ccccc1)c1ccccc1',\n",
       "    'true_reactants': 'CC(=O)N(c1ccccc1)c1ccccc1.CCOC(=O)C[C@H](O)CC#N',\n",
       "    'true_distance_to_starting_material': 0.22590068159688412,\n",
       "    'solved': True,\n",
       "    'working_params': ['Atorvastatin_reactions_routes190_seed42_modelrootaligned_steeredfalse_guidance0_length0_results100_candidates53_time20251117_180056'],\n",
       "    'has_starting_material': [False],\n",
       "    'num_samples': [65],\n",
       "    'min_pred_tanimoto_to_starting_material': [0.1015873015873015],\n",
       "    'max_pred_tanimoto_to_starting_material': [0.3517745302713987],\n",
       "    'mean_pred_tanimoto_to_starting_material': [0.23794780505086066],\n",
       "    'true_tanimoto_to_starting_material': [0.22590068159688412],\n",
       "    'avg_true_class_matches': [0.5692307692307692]}]}]"
      ]
     },
     "execution_count": 91,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "aggregates[0]['route_completion']['mixed_param_completion']['route_details']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "id": "6a948283",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "0\n",
      "setps_solved 9/12\n",
      "step 0: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1.O\n",
      "step 1: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)CC(=O)OC(C)(C)C\n",
      "step 2: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)CC(=O)OC(C)(C)C\n",
      "step true reactants: CC(=O)OC(C)(C)C.COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step 3: False\n",
      "step true product: COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CO[Na]\n",
      "step 4: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1\n",
      "step true reactants: CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O\n",
      "step 5: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step 6: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step true reactants: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1.O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step 7: True\n",
      "step true product: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step 8: True\n",
      "step true product: O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step true reactants: Nc1ccccc1.O=C(O)C#Cc1ccccc1\n",
      "step 9: True\n",
      "step true product: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step true reactants: CC(C)C(=O)Cl.CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step 10: True\n",
      "step true product: CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(Br)c1ccc(F)cc1.NCCC1OCCO1\n",
      "step 11: True\n",
      "step true product: CCOC(=O)C(Br)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)Cc1ccc(F)cc1.O=C1CCC(=O)N1Br\n",
      "setps_solved 8/10\n",
      "step 0: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1.O\n",
      "step 1: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1\n",
      "step true reactants: COC(=O)CC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step 2: True\n",
      "step true product: COC(=O)CC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O.COC(=O)CC(C)=O\n",
      "step 3: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step 4: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step true reactants: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1.O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step 5: True\n",
      "step true product: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step 6: True\n",
      "step true product: O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step true reactants: Nc1ccccc1.O=C(O)C#Cc1ccccc1\n",
      "step 7: True\n",
      "step true product: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step true reactants: CC(C)C(=O)Cl.CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step 8: True\n",
      "step true product: CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(Br)c1ccc(F)cc1.NCCC1OCCO1\n",
      "step 9: True\n",
      "step true product: CCOC(=O)C(Br)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)Cc1ccc(F)cc1.O=C1CCC(=O)N1Br\n",
      "setps_solved 8/9\n",
      "step 0: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1.O\n",
      "step 1: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)OC(C)(C)O1\n",
      "step 2: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)OC(C)(C)O1\n",
      "step true reactants: CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1.CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step 3: False\n",
      "step true product: CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1\n",
      "step true reactants: CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1.O=Cc1ccc(F)cc1\n",
      "step 4: True\n",
      "step true product: CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step true reactants: CC1(C)O[C@H](CC#N)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step 5: True\n",
      "step true product: CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1\n",
      "step true reactants: CC(C)C(=O)CC(=O)Nc1ccccc1.O=Cc1ccccc1\n",
      "step 6: True\n",
      "step true product: CC1(C)O[C@H](CC#N)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step true reactants: COC(C)(C)OC.N#CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step 7: True\n",
      "step true product: N#CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step true reactants: N#CC[C@@H](O)CC(=O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step 8: True\n",
      "step true product: N#CC[C@@H](O)CC(=O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step true reactants: CC(=O)N(c1ccccc1)c1ccccc1.CCOC(=O)C[C@H](O)CC#N\n",
      "----------------------------------------------------------------------------------------------------\n",
      "1\n",
      "setps_solved 9/12\n",
      "step 0: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1.O\n",
      "step 1: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)CC(=O)OC(C)(C)C\n",
      "step 2: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)CC(=O)OC(C)(C)C\n",
      "step true reactants: CC(=O)OC(C)(C)C.COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step 3: False\n",
      "step true product: COC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CO[Na]\n",
      "step 4: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1\n",
      "step true reactants: CC(=O)O[C@@H](c1ccccc1)C(O)(c1ccccc1)c1ccccc1.CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O\n",
      "step 5: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step 6: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step true reactants: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1.O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step 7: True\n",
      "step true product: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step 8: True\n",
      "step true product: O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step true reactants: Nc1ccccc1.O=C(O)C#Cc1ccccc1\n",
      "step 9: True\n",
      "step true product: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step true reactants: CC(C)C(=O)Cl.CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step 10: True\n",
      "step true product: CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(Br)c1ccc(F)cc1.NCCC1OCCO1\n",
      "step 11: True\n",
      "step true product: CCOC(=O)C(Br)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)Cc1ccc(F)cc1.O=C1CCC(=O)N1Br\n",
      "setps_solved 8/10\n",
      "step 0: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1.O\n",
      "step 1: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@@H](O)CC(=O)O1\n",
      "step true reactants: COC(=O)CC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step 2: True\n",
      "step true product: COC(=O)CC(=O)C[C@H](O)CCn1c(-c2ccc(F)cc2)c(-c2ccccc2)c(C(=O)Nc2ccccc2)c1C(C)C\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O.COC(=O)CC(C)=O\n",
      "step 3: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC=O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step 4: False\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CCC1OCCO1\n",
      "step true reactants: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1.O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step 5: True\n",
      "step true product: CC(C)C(=O)N(CCC1OCCO1)C(C(=O)O)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step 6: True\n",
      "step true product: O=C(C#Cc1ccccc1)Nc1ccccc1\n",
      "step true reactants: Nc1ccccc1.O=C(O)C#Cc1ccccc1\n",
      "step 7: True\n",
      "step true product: CCOC(=O)C(c1ccc(F)cc1)N(CCC1OCCO1)C(=O)C(C)C\n",
      "step true reactants: CC(C)C(=O)Cl.CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step 8: True\n",
      "step true product: CCOC(=O)C(NCCC1OCCO1)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)C(Br)c1ccc(F)cc1.NCCC1OCCO1\n",
      "step 9: True\n",
      "step true product: CCOC(=O)C(Br)c1ccc(F)cc1\n",
      "step true reactants: CCOC(=O)Cc1ccc(F)cc1.O=C1CCC(=O)N1Br\n",
      "setps_solved 8/9\n",
      "step 0: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)O\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1.O\n",
      "step 1: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step true reactants: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)OC(C)(C)O1\n",
      "step 2: True\n",
      "step true product: CC(C)c1c(C(=O)Nc2ccccc2)c(-c2ccccc2)c(-c2ccc(F)cc2)n1CC[C@@H]1C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)OC(C)(C)O1\n",
      "step true reactants: CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1.CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step 3: False\n",
      "step true product: CC(C)C(=O)C(C(=O)Nc1ccccc1)C(C(=O)c1ccc(F)cc1)c1ccccc1\n",
      "step true reactants: CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1.O=Cc1ccc(F)cc1\n",
      "step 4: True\n",
      "step true product: CC1(C)O[C@H](CCN)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step true reactants: CC1(C)O[C@H](CC#N)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step 5: True\n",
      "step true product: CC(C)C(=O)/C(=C/c1ccccc1)C(=O)Nc1ccccc1\n",
      "step true reactants: CC(C)C(=O)CC(=O)Nc1ccccc1.O=Cc1ccccc1\n",
      "step 6: True\n",
      "step true product: CC1(C)O[C@H](CC#N)C[C@H](CC(=O)N(c2ccccc2)c2ccccc2)O1\n",
      "step true reactants: COC(C)(C)OC.N#CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step 7: True\n",
      "step true product: N#CC[C@@H](O)C[C@@H](O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step true reactants: N#CC[C@@H](O)CC(=O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step 8: True\n",
      "step true product: N#CC[C@@H](O)CC(=O)CC(=O)N(c1ccccc1)c1ccccc1\n",
      "step true reactants: CC(=O)N(c1ccccc1)c1ccccc1.CCOC(=O)C[C@H](O)CC#N\n"
     ]
    }
   ],
   "source": [
    "for agg_idx in range(len(aggregates)):\n",
    "    print('-'*100)\n",
    "    print(f'{agg_idx}')\n",
    "    route_details = aggregates[agg_idx]['route_completion']['mixed_param_completion']['route_details']\n",
    "    for route_info in route_details:\n",
    "        print(f'setps_solved {route_info[\"steps_solved\"]}/{route_info[\"total_steps\"]}')\n",
    "        for step_idx, step_result in enumerate(route_info['step_results']):\n",
    "            print(f'step {step_idx}: {step_result[\"solved\"]}')\n",
    "            print(f'step true product: {route_info[\"step_results\"][step_idx][\"true_product\"]}')\n",
    "            print(f'step true reactants: {route_info[\"step_results\"][step_idx][\"true_reactants\"]}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "id": "39b81d18",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "0\n",
      "----------------------------------------------------------------------------------------------------\n",
      "1\n",
      "steps_solved_by_agg1_not_agg0: []\n",
      "steps_solved_by_agg0_not_agg1: []\n"
     ]
    }
   ],
   "source": [
    "results_per_agg = {\n",
    "}\n",
    "for agg_idx in range(len(aggregates)):\n",
    "    results_per_agg[agg_idx] = {\n",
    "        'steps_solved': [],\n",
    "    }\n",
    "    print('-'*100)\n",
    "    print(f'{agg_idx}')\n",
    "    route_details = aggregates[agg_idx]['route_completion']['mixed_param_completion']['route_details']\n",
    "    for route_idx, route_info in enumerate(route_details):\n",
    "        for step_idx, step_result in enumerate(route_info['step_results']):\n",
    "            if step_result['solved']:\n",
    "                results_per_agg[agg_idx]['steps_solved'].append((route_idx, step_idx))\n",
    "\n",
    "# find steps solved by agg 1 and not agg 0\n",
    "steps_solved_by_agg1_not_agg0 = [step for step in results_per_agg[1]['steps_solved'] if step not in results_per_agg[0]['steps_solved']]\n",
    "steps_solved_by_agg0_not_agg1 = [step for step in results_per_agg[0]['steps_solved'] if step not in results_per_agg[1]['steps_solved']]\n",
    "print(f'steps_solved_by_agg1_not_agg0: {steps_solved_by_agg1_not_agg0}')\n",
    "print(f'steps_solved_by_agg0_not_agg1: {steps_solved_by_agg0_not_agg1}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 88,
   "id": "5b914e28",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "----------------------------------------------------------------------------------------------------\n",
      "0\n",
      "completion_rate: 0.0\n",
      "perc_samples_per_product: 0.7238095238095238\n",
      "percentage_products_with_exact_match: 0.8095238095238095\n",
      "percentage_products_with_class_correct: 1.0\n",
      "perc_class_correct_samples_per_product: 0.2333333333333333\n",
      "percentage_products_with_rxn_name_correct: 1.0\n",
      "avg_rxn_name_correct_samples_per_product: 11.333333333333334\n",
      "percentage_products_with_round_trip_correct: 0.9047619047619048\n",
      "perc_round_trip_correct_samples_per_product: 0.06210526315789473\n",
      "----------------------------------------------------------------------------------------------------\n",
      "----------------------------------------------------------------------------------------------------\n",
      "1\n",
      "completion_rate: 0.0\n",
      "perc_samples_per_product: 0.7757142857142857\n",
      "percentage_products_with_exact_match: 0.8095238095238095\n",
      "percentage_products_with_class_correct: 1.0\n",
      "perc_class_correct_samples_per_product: 0.26\n",
      "percentage_products_with_rxn_name_correct: 1.0\n",
      "avg_rxn_name_correct_samples_per_product: 12.19047619047619\n",
      "percentage_products_with_round_trip_correct: 0.9047619047619048\n",
      "perc_round_trip_correct_samples_per_product: 0.0668421052631579\n",
      "----------------------------------------------------------------------------------------------------\n"
     ]
    }
   ],
   "source": [
    "# perc_samples_per_product\n",
    "# percentage_products_with_exact_match\n",
    "# percentage_products_with_class_correct\n",
    "# perc_class_correct_samples_per_product\n",
    "# percentage_products_with_rxn_name_correct\n",
    "# avg_rxn_name_correct_samples_per_product\n",
    "keys = ['completion_rate', 'perc_samples_per_product', \n",
    "'percentage_products_with_exact_match', 'percentage_products_with_class_correct', \n",
    "'perc_class_correct_samples_per_product', 'percentage_products_with_rxn_name_correct', \n",
    "'avg_rxn_name_correct_samples_per_product', 'percentage_products_with_round_trip_correct',\n",
    "'perc_round_trip_correct_samples_per_product']\n",
    "\n",
    "for agg_idx in range(len(aggregates)):\n",
    "    print('-'*100)\n",
    "    print(f'{agg_idx}')\n",
    "    for key in keys:\n",
    "        print(f'{key}: {aggregates[agg_idx][key]}')\n",
    "    print('-'*100)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "803a5382",
   "metadata": {},
   "source": [
    "# Analyze dfs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "68825f78",
   "metadata": {},
   "outputs": [],
   "source": [
    "eval_dir = '/Users/laabidn1/multiguide/experiments/manual_synthesis/reaction_type/route_similarity_data_routes190_seed42_modelrootaligned_steeredtrue_guidance0.5_length15_results100_candidates53_time20251117_125709'\n",
    "dfs = [pd.read_csv(os.path.join(eval_dir, f)) for f in os.listdir(eval_dir) if f.startswith('eval')]\n",
    "df = pd.concat(dfs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0108e0e3",
   "metadata": {},
   "outputs": [],
   "source": [
    "df['topk'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ee1a2b6b",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "syntheseus-in-python10",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
