{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "c6aa39ec-eab7-4fe4-b3f8-acda6de31e53",
   "metadata": {},
   "source": [
    "# End-to-End"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "18ae4c5e-92ab-4229-80eb-27ac257c81f4",
   "metadata": {},
   "outputs": [],
   "source": [
    "from GOTabPFN import GraphFeatureOrdering, PIDFSegPCA, TabPFN25Head, TabPFN25Config"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "05840a50-8379-42c2-ac86-afdbcc738d92",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[I 2026-01-21 22:12:10,602] A new study created in memory with name: no-name-b846fbce-3ffd-4749-8477-4f696f031a1f\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[DATA] arcene_combined_encoded.csv | X=(200, 10000) | C=2 | map={0: 0, 1: 1}\n",
      "[GPU ] cuda= True | visible_gpus= 8\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "81b0e74a91dd4aeabef341d68bac9172",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/150 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[I 2026-01-21 22:15:08,807] Trial 0 finished with value: 0.611 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.8638900372842315, 'nsc_beta': 0.26210622617823776, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 0 with value: 0.611.\n",
      "[I 2026-01-21 22:18:40,189] Trial 1 finished with value: 0.727 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 9, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 1.0904545778210761, 'nsc_beta': 0.2927972976869379, 'nsc_Mmin': 48, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 1 with value: 0.727.\n",
      "[I 2026-01-21 22:23:00,452] Trial 2 finished with value: 0.8490000000000001 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.0508382534881904, 'nsc_beta': 0.09710228429397401, 'nsc_Mmin': 32, 'nsc_Mmax': 128, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 2 with value: 0.8490000000000001.\n",
      "[I 2026-01-21 22:27:33,605] Trial 3 finished with value: 0.655 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 1.727259204758588, 'nsc_beta': 0.8746038744488647, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 2 with value: 0.8490000000000001.\n",
      "[I 2026-01-21 22:32:01,593] Trial 4 finished with value: 0.872 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 11, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.873459977473469, 'nsc_beta': 0.12376884973139393, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 4 with value: 0.872.\n",
      "[I 2026-01-21 22:34:07,671] Trial 5 finished with value: 0.889 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.2992657980944293, 'nsc_beta': 0.7643010694447602, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 22:39:10,634] Trial 6 pruned. \n",
      "[I 2026-01-21 22:42:35,135] Trial 7 finished with value: 0.746 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.2457809516380003, 'nsc_beta': 0.0768127184943912, 'nsc_Mmin': 64, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 22:47:44,277] Trial 8 finished with value: 0.875 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 1.9483476581746504, 'nsc_beta': 0.08805074458590133, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 22:52:34,024] Trial 9 pruned. \n",
      "[I 2026-01-21 22:58:07,054] Trial 10 finished with value: 0.857 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.7171324862390933, 'nsc_beta': 0.6996607815238783, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:00:50,016] Trial 11 finished with value: 0.879 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.659719394687937, 'nsc_beta': 0.6890912001274871, 'nsc_Mmin': 32, 'nsc_Mmax': 128, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:03:31,089] Trial 12 finished with value: 0.8740000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 2.2673506469969364, 'nsc_beta': 0.6941392316580696, 'nsc_Mmin': 64, 'nsc_Mmax': 128, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:06:59,849] Trial 13 finished with value: 0.7709999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.855988067154185, 'nsc_beta': 0.6277014834302466, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:11:06,805] Trial 14 finished with value: 0.8830000000000001 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.633252049099552, 'nsc_beta': 0.37591589998824204, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:15:08,497] Trial 15 finished with value: 0.888 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.435636696443382, 'nsc_beta': 0.5107591653920608, 'nsc_Mmin': 48, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:18:21,118] Trial 16 finished with value: 0.873 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 1.6714756317079884, 'nsc_beta': 0.843449356251761, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:21:19,678] Trial 17 finished with value: 0.889 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 1.9459417793617477, 'nsc_beta': 0.5054185218330391, 'nsc_Mmin': 48, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 5 with value: 0.889.\n",
      "[I 2026-01-21 23:23:35,483] Trial 18 pruned. \n",
      "[I 2026-01-21 23:27:09,340] Trial 19 finished with value: 0.8919999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.342719577255867, 'nsc_beta': 0.8369923182219433, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 19 with value: 0.8919999999999999.\n",
      "[I 2026-01-21 23:29:04,770] Trial 20 pruned. \n",
      "[I 2026-01-21 23:31:10,640] Trial 21 pruned. \n",
      "[I 2026-01-21 23:34:26,723] Trial 22 finished with value: 0.8690000000000001 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.7041235538362067, 'nsc_beta': 0.6098544305090461, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 19 with value: 0.8919999999999999.\n",
      "[I 2026-01-21 23:37:58,842] Trial 23 finished with value: 0.8909999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.8198387162395244, 'nsc_beta': 0.7159727243772945, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 19 with value: 0.8919999999999999.\n",
      "[I 2026-01-21 23:42:04,844] Trial 24 finished with value: 0.87 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.6547775079676477, 'nsc_beta': 0.8860309285982307, 'nsc_Mmin': 64, 'nsc_Mmax': 256, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 19 with value: 0.8919999999999999.\n",
      "[I 2026-01-21 23:45:19,698] Trial 25 finished with value: 0.888 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.9354248121688618, 'nsc_beta': 0.5957019283486162, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 19 with value: 0.8919999999999999.\n",
      "[I 2026-01-21 23:49:09,120] Trial 26 pruned. \n",
      "[I 2026-01-21 23:53:36,532] Trial 27 finished with value: 0.883 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.951883579829571, 'nsc_beta': 0.7177927714018197, 'nsc_Mmin': 16, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 19 with value: 0.8919999999999999.\n",
      "[I 2026-01-21 23:57:50,784] Trial 28 finished with value: 0.9009999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.419952438073638, 'nsc_beta': 0.6404561818309986, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:01:39,462] Trial 29 finished with value: 0.8780000000000001 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.590116937810835, 'nsc_beta': 0.8673356903159256, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:04:32,325] Trial 30 pruned. \n",
      "[I 2026-01-22 00:07:16,177] Trial 31 pruned. \n",
      "[I 2026-01-22 00:11:08,016] Trial 32 pruned. \n",
      "[I 2026-01-22 00:17:25,355] Trial 33 finished with value: 0.8799999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 8, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.4861832351389777, 'nsc_beta': 0.511306891742265, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:20:57,972] Trial 34 finished with value: 0.8909999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.5507429090425906, 'nsc_beta': 0.7136150798222788, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:23:57,258] Trial 35 finished with value: 0.884 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.3300852862920087, 'nsc_beta': 0.7061503168515213, 'nsc_Mmin': 64, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:27:06,626] Trial 36 finished with value: 0.8859999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.2810381078500517, 'nsc_beta': 0.8498334608521844, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:30:47,492] Trial 37 finished with value: 0.858 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.905518496577023, 'nsc_beta': 0.5742838611962998, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:34:45,548] Trial 38 finished with value: 0.8829999999999998 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4989432750653, 'nsc_beta': 0.6015492617747632, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:37:05,688] Trial 39 finished with value: 0.888 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.3205237010071413, 'nsc_beta': 0.7070584551768649, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:39:19,481] Trial 40 pruned. \n",
      "[I 2026-01-22 00:42:53,311] Trial 41 finished with value: 0.878 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.6736073397126714, 'nsc_beta': 0.7035940142938294, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:45:56,618] Trial 42 finished with value: 0.8859999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.403631712844683, 'nsc_beta': 0.49374637371778557, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:48:52,872] Trial 43 finished with value: 0.89 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.546529521813074, 'nsc_beta': 0.8961646054075436, 'nsc_Mmin': 16, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:52:18,367] Trial 44 finished with value: 0.8860000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7204672294046546, 'nsc_beta': 0.8794182948112711, 'nsc_Mmin': 16, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 28 with value: 0.9009999999999999.\n",
      "[I 2026-01-22 00:54:54,977] Trial 45 pruned. \n",
      "[I 2026-01-22 00:57:25,487] Trial 46 finished with value: 0.902 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.3410353411302114, 'nsc_beta': 0.7736434115032446, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 46 with value: 0.902.\n",
      "[I 2026-01-22 01:00:34,493] Trial 47 finished with value: 0.9059999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.1534471124535814, 'nsc_beta': 0.8882602627359169, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:04:00,177] Trial 48 finished with value: 0.877 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.0075785962510757, 'nsc_beta': 0.6130768573979248, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:07:05,513] Trial 49 finished with value: 0.8910000000000002 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.142095870319747, 'nsc_beta': 0.7148082582861239, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:10:13,125] Trial 50 finished with value: 0.884 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.95, 'nsc_gamma': 2.1844690783796206, 'nsc_beta': 0.5868123160624824, 'nsc_Mmin': 64, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:14:06,832] Trial 51 finished with value: 0.8919999999999999 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.372610310347526, 'nsc_beta': 0.521671255160336, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:16:10,546] Trial 52 pruned. \n",
      "[I 2026-01-22 01:19:35,995] Trial 53 finished with value: 0.8909999999999999 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.283498089809367, 'nsc_beta': 0.8552921847946098, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:23:03,344] Trial 54 finished with value: 0.8890000000000002 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 1.7244530382300391, 'nsc_beta': 0.894796053316738, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:26:50,368] Trial 55 finished with value: 0.8859999999999999 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.205464620669211, 'nsc_beta': 0.5736083336549418, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:30:08,422] Trial 56 finished with value: 0.879 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 1.8535032055183596, 'nsc_beta': 0.6642952145266315, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:31:54,210] Trial 57 pruned. \n",
      "[I 2026-01-22 01:35:21,058] Trial 58 finished with value: 0.899 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 2.3168291388506086, 'nsc_beta': 0.46256144256349996, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:39:21,836] Trial 59 finished with value: 0.855 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.6465071619349199, 'nsc_beta': 0.5964328382444832, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:42:56,889] Trial 60 finished with value: 0.894 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.179205756360312, 'nsc_beta': 0.6670349544644395, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:45:23,021] Trial 61 pruned. \n",
      "[I 2026-01-22 01:47:26,327] Trial 62 pruned. \n",
      "[I 2026-01-22 01:51:30,837] Trial 63 finished with value: 0.8859999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.136105157365709, 'nsc_beta': 0.6518952317415735, 'nsc_Mmin': 64, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:54:19,623] Trial 64 finished with value: 0.8550000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 1.8784860075068002, 'nsc_beta': 0.8884235200161648, 'nsc_Mmin': 16, 'nsc_Mmax': 128, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:56:28,015] Trial 65 finished with value: 0.8919999999999999 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.4877228266596942, 'nsc_beta': 0.6014768042222288, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 01:59:52,091] Trial 66 finished with value: 0.89 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.9435646508172293, 'nsc_beta': 0.7642854085072514, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:03:30,840] Trial 67 finished with value: 0.887 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.0912305202846686, 'nsc_beta': 0.7270868658209446, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:05:21,254] Trial 68 pruned. \n",
      "[I 2026-01-22 02:10:13,927] Trial 69 finished with value: 0.8460000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.3731656971125084, 'nsc_beta': 0.847358931555265, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:13:42,022] Trial 70 finished with value: 0.892 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.4123967135835755, 'nsc_beta': 0.8459664079559895, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:17:53,770] Trial 71 finished with value: 0.8889999999999999 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.4998478164961337, 'nsc_beta': 0.8283922033736838, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:21:39,291] Trial 72 finished with value: 0.899 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.3817109283377076, 'nsc_beta': 0.7611260217351294, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:24:18,170] Trial 73 pruned. \n",
      "[I 2026-01-22 02:26:44,818] Trial 74 pruned. \n",
      "[I 2026-01-22 02:29:49,417] Trial 75 finished with value: 0.892 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.666046677427701, 'nsc_beta': 0.885594596642099, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:32:29,099] Trial 76 finished with value: 0.892 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.488491844113254, 'nsc_beta': 0.8669076312558066, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:35:51,213] Trial 77 pruned. \n",
      "[I 2026-01-22 02:38:14,055] Trial 78 pruned. \n",
      "[I 2026-01-22 02:40:39,351] Trial 79 finished with value: 0.889 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.95, 'nsc_gamma': 2.563689602819097, 'nsc_beta': 0.7961712444773009, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:43:14,407] Trial 80 finished with value: 0.892 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.7882189356156992, 'nsc_beta': 0.6172823442264417, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:47:01,240] Trial 81 finished with value: 0.875 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.500233940430698, 'nsc_beta': 0.8951544763984554, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:49:29,673] Trial 82 pruned. \n",
      "[I 2026-01-22 02:52:36,326] Trial 83 finished with value: 0.8769999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.877326082944783, 'nsc_beta': 0.8923518503108249, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:55:19,944] Trial 84 finished with value: 0.8860000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.7839638828144095, 'nsc_beta': 0.6833735361479922, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 02:57:00,556] Trial 85 pruned. \n",
      "[I 2026-01-22 03:00:18,727] Trial 86 pruned. \n",
      "[I 2026-01-22 03:02:36,856] Trial 87 finished with value: 0.8809999999999999 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.95, 'nsc_gamma': 2.6896387416241754, 'nsc_beta': 0.5979379013653668, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:04:06,595] Trial 88 pruned. \n",
      "[I 2026-01-22 03:06:39,266] Trial 89 finished with value: 0.878 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.618738026466258, 'nsc_beta': 0.7291958666395313, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:09:48,864] Trial 90 finished with value: 0.8889999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.4339318656517315, 'nsc_beta': 0.8294605291687022, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:13:16,069] Trial 91 finished with value: 0.879 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.382043051590435, 'nsc_beta': 0.5258705414297247, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:16:19,215] Trial 92 finished with value: 0.8769999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.559905336745142, 'nsc_beta': 0.5114313392821074, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:19:11,923] Trial 93 finished with value: 0.892 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.745410118688102, 'nsc_beta': 0.8663418341691258, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:22:14,757] Trial 94 finished with value: 0.8730000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.675037129013478, 'nsc_beta': 0.8388268234124394, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:24:37,144] Trial 95 finished with value: 0.878 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 1.947825831579137, 'nsc_beta': 0.41442790950030045, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:26:22,351] Trial 96 pruned. \n",
      "[I 2026-01-22 03:30:03,094] Trial 97 finished with value: 0.9059999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.977122612057703, 'nsc_beta': 0.6113427551863525, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:34:54,715] Trial 98 finished with value: 0.897 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.6202637024057083, 'nsc_beta': 0.4993334367669342, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:38:39,876] Trial 99 pruned. \n",
      "[I 2026-01-22 03:42:30,235] Trial 100 finished with value: 0.8969999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.8546545293479437, 'nsc_beta': 0.6021342652708657, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:46:37,948] Trial 101 finished with value: 0.885 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.9822373720172, 'nsc_beta': 0.6538064053736582, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:49:42,934] Trial 102 finished with value: 0.899 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.0907485261831043, 'nsc_beta': 0.27165704920314937, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:53:33,070] Trial 103 finished with value: 0.8759999999999999 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.2454023296135963, 'nsc_beta': 0.15536109522808833, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 03:56:57,763] Trial 104 finished with value: 0.8969999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.144538543752493, 'nsc_beta': 0.27654358590501044, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 04:00:00,952] Trial 105 finished with value: 0.8860000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.9736245246628126, 'nsc_beta': 0.2722997660085934, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 04:05:09,267] Trial 106 finished with value: 0.9049999999999998 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 6, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.55113708542624, 'nsc_beta': 0.5699593396551257, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 04:09:39,237] Trial 107 pruned. \n",
      "[I 2026-01-22 04:13:09,027] Trial 108 finished with value: 0.871 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.56401435068649, 'nsc_beta': 0.3625624040062372, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 04:17:56,668] Trial 109 finished with value: 0.883 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.9552613151292433, 'nsc_beta': 0.44338329531577303, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 47 with value: 0.9059999999999999.\n",
      "[I 2026-01-22 04:20:06,479] Trial 110 pruned. \n",
      "[I 2026-01-22 04:23:03,389] Trial 111 finished with value: 0.9060000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.2630914693745914, 'nsc_beta': 0.19381705297890106, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:26:05,434] Trial 112 finished with value: 0.898 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.512807002949363, 'nsc_beta': 0.32006141241290753, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:29:12,526] Trial 113 finished with value: 0.8939999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.5291953204832334, 'nsc_beta': 0.28253423430533114, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:32:37,025] Trial 114 finished with value: 0.889 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.479247280213373, 'nsc_beta': 0.27032901528672976, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:37:48,006] Trial 115 finished with value: 0.8919999999999999 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.3538268732383445, 'nsc_beta': 0.5476112273829509, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:40:05,899] Trial 116 pruned. \n",
      "[I 2026-01-22 04:44:11,324] Trial 117 finished with value: 0.898 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.616162674140344, 'nsc_beta': 0.8210173174956442, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:48:12,046] Trial 118 finished with value: 0.9 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.5771811104875537, 'nsc_beta': 0.8927425353424482, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:52:30,534] Trial 119 pruned. \n",
      "[I 2026-01-22 04:57:27,188] Trial 120 finished with value: 0.887 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.1462714254818125, 'nsc_beta': 0.5615131526505746, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 04:59:59,961] Trial 121 pruned. \n",
      "[I 2026-01-22 05:05:49,214] Trial 122 finished with value: 0.883 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.9346162744046023, 'nsc_beta': 0.42687995768923404, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:08:29,482] Trial 123 pruned. \n",
      "[I 2026-01-22 05:11:02,134] Trial 124 pruned. \n",
      "[I 2026-01-22 05:15:21,176] Trial 125 finished with value: 0.8959999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.7698958202359605, 'nsc_beta': 0.1055443069066141, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:19:06,164] Trial 126 finished with value: 0.882 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.6223081480226917, 'nsc_beta': 0.6260309068171015, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:22:27,427] Trial 127 finished with value: 0.894 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.0182457194356465, 'nsc_beta': 0.053560311684994366, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:26:19,199] Trial 128 finished with value: 0.8830000000000001 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.639823353055334, 'nsc_beta': 0.8532609768636694, 'nsc_Mmin': 48, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:30:25,649] Trial 129 finished with value: 0.882 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.320227084453448, 'nsc_beta': 0.21197031278410622, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:33:54,823] Trial 130 finished with value: 0.887 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 1.7049032685460574, 'nsc_beta': 0.23401550024647452, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:36:03,866] Trial 131 pruned. \n",
      "[I 2026-01-22 05:38:28,221] Trial 132 pruned. \n",
      "[I 2026-01-22 05:42:52,372] Trial 133 finished with value: 0.894 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.7560887618908225, 'nsc_beta': 0.32890022200202007, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:44:58,228] Trial 134 pruned. \n",
      "[I 2026-01-22 05:50:16,885] Trial 135 finished with value: 0.8759999999999999 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 8, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.648071484319429, 'nsc_beta': 0.8530210568634008, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 05:52:08,206] Trial 136 pruned. \n",
      "[I 2026-01-22 05:55:59,938] Trial 137 finished with value: 0.885 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.0486834185622875, 'nsc_beta': 0.785995957980608, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:00:04,506] Trial 138 finished with value: 0.889 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 1.727458805866552, 'nsc_beta': 0.16652925828775983, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:03:18,986] Trial 139 finished with value: 0.8859999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.456561523942324, 'nsc_beta': 0.5111809758386435, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:07:57,551] Trial 140 finished with value: 0.8780000000000001 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.418739480790951, 'nsc_beta': 0.5803870261270224, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:11:35,063] Trial 141 finished with value: 0.887 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.6550247857878118, 'nsc_beta': 0.05826155425037596, 'nsc_Mmin': 64, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:16:20,315] Trial 142 finished with value: 0.89 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.8893233408344554, 'nsc_beta': 0.4608329547967294, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:20:40,250] Trial 143 finished with value: 0.883 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.931127223865209, 'nsc_beta': 0.7558903519434201, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:25:54,595] Trial 144 pruned. \n",
      "[I 2026-01-22 06:28:04,658] Trial 145 pruned. \n",
      "[I 2026-01-22 06:31:55,752] Trial 146 finished with value: 0.8919999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4266355077608055, 'nsc_beta': 0.10828234834847038, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:35:34,830] Trial 147 finished with value: 0.8969999999999999 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.8900931222216557, 'nsc_beta': 0.3633982627311595, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:39:28,892] Trial 148 finished with value: 0.873 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.816533136323188, 'nsc_beta': 0.27505009627592975, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 111 with value: 0.9060000000000001.\n",
      "[I 2026-01-22 06:42:09,905] Trial 149 pruned. \n",
      "\n",
      "================ BEST TRIAL ================\n",
      "mean_acc ± std_acc = 0.906000 ± 0.039713\n",
      "\n",
      "Best hyperparameters:\n",
      "  go_metric: euclidean\n",
      "  go_num_clusters: 4\n",
      "  go_refine_passes: 1\n",
      "  go_direction_select: False\n",
      "  nsc_segmentation: uniform\n",
      "  nsc_m_rule: gamma\n",
      "  nsc_tau: 0.99\n",
      "  nsc_gamma: 2.2630914693745914\n",
      "  nsc_beta: 0.19381705297890106\n",
      "  nsc_Mmin: 16\n",
      "  nsc_Mmax: 640\n",
      "  nsc_lmin: 16\n",
      "  assume_standardized: True\n",
      "  tabpfn_seed: 4\n"
     ]
    }
   ],
   "source": [
    "# ============================================================\n",
    "# ONE CELL (Arcene): OPTUNA with GO-LR ONCE per trial \n",
    "# Per trial:\n",
    "#   1) GO-LR fit on FULL X -> Pi_star (fixed for all folds in that trial)\n",
    "#   2) 5x5 CV folds:\n",
    "#        NSC configure on train only (uses fixed Pi_star)\n",
    "#        compress train/val\n",
    "#        TabPFN fit on train, eval on val\n",
    "# ============================================================\n",
    "\n",
    "import os, sys, gc, random, warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "\n",
    "os.environ.setdefault(\"PYTORCH_CUDA_ALLOC_CONF\", \"expandable_segments:True\")\n",
    "os.environ.setdefault(\"CUDA_DEVICE_ORDER\", \"PCI_BUS_ID\")\n",
    "\n",
    "import optuna\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import torch\n",
    "\n",
    "from sklearn.model_selection import RepeatedStratifiedKFold\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "from sklearn.metrics import accuracy_score\n",
    "from tqdm import tqdm\n",
    "\n",
    "#   GraphFeatureOrdering, pidf_segpca, TabPFN25Head, TabPFN25Config\n",
    "from gotabpfn import GraphFeatureOrdering, pidf_segpca, TabPFN25Head, TabPFN25Config\n",
    "PIDFSegPCA = pidf_segpca  # alias to match your earlier naming\n",
    "\n",
    "# -----------------------\n",
    "# Config\n",
    "# -----------------------\n",
    "SEED = 42\n",
    "DATA_FILE  = \"arcene_combined_encoded.csv\"\n",
    "TARGET_COL = \"Label\"\n",
    "\n",
    "N_TRIALS = 150\n",
    "GPU_ID = 6  # change if needed\n",
    "\n",
    "# If you want to force which GPU is visible for kmeans_gpu + tabpfn:\n",
    "if \"torch\" not in sys.modules:\n",
    "    os.environ[\"CUDA_VISIBLE_DEVICES\"] = str(GPU_ID)\n",
    "\n",
    "# -----------------------\n",
    "# Utils\n",
    "# -----------------------\n",
    "def seed_everything(seed: int = 42):\n",
    "    random.seed(seed)\n",
    "    np.random.seed(seed)\n",
    "    torch.manual_seed(seed)\n",
    "    if torch.cuda.is_available():\n",
    "        torch.cuda.manual_seed_all(seed)\n",
    "    os.environ[\"PYTHONHASHSEED\"] = str(seed)\n",
    "\n",
    "def cleanup_cuda():\n",
    "    gc.collect()\n",
    "    if torch.cuda.is_available():\n",
    "        try:\n",
    "            torch.cuda.synchronize()\n",
    "        except Exception:\n",
    "            pass\n",
    "        torch.cuda.empty_cache()\n",
    "\n",
    "def ensure_multiclass_contiguous(y: np.ndarray):\n",
    "    y = np.asarray(y).reshape(-1)\n",
    "    uniq = np.unique(y)\n",
    "    uniq_sorted = np.sort(uniq)\n",
    "    class_map = {orig: i for i, orig in enumerate(uniq_sorted.tolist())}\n",
    "    y_enc = np.vectorize(class_map.get, otypes=[np.int64])(y).astype(np.int64)\n",
    "    return y_enc, class_map, int(len(class_map))\n",
    "\n",
    "def compute_deltas_adjacent_corr(X_tr: np.ndarray, Pi_star: list[int], eps: float = 1e-12) -> torch.Tensor:\n",
    "    \"\"\"\n",
    "    delta[t] = 1 - |corr(feature_{Pi[t]}, feature_{Pi[t+1]})|\n",
    "    Returns torch.Tensor shape (m-1,) on CPU.\n",
    "    \"\"\"\n",
    "    X = torch.from_numpy(X_tr).float()  # CPU\n",
    "    perm = torch.tensor(Pi_star, dtype=torch.long)\n",
    "    Xp = X[:, perm]\n",
    "    Xc = Xp - Xp.mean(dim=0, keepdim=True)\n",
    "    std = Xc.std(dim=0, unbiased=False, keepdim=True).clamp_min(eps)\n",
    "    Z = Xc / std\n",
    "    corr = (Z[:, :-1] * Z[:, 1:]).mean(dim=0)\n",
    "    return (1.0 - corr.abs()).cpu()\n",
    "\n",
    "# -----------------------\n",
    "# Load data\n",
    "# -----------------------\n",
    "seed_everything(SEED)\n",
    "df = pd.read_csv(DATA_FILE)\n",
    "\n",
    "y_raw = df[TARGET_COL].to_numpy()\n",
    "X_df  = df.drop(columns=[TARGET_COL])\n",
    "\n",
    "y, class_map, NUM_CLASSES = ensure_multiclass_contiguous(y_raw)\n",
    "\n",
    "# Standardize globally \n",
    "scaler = StandardScaler()\n",
    "X_scaled = scaler.fit_transform(X_df.values).astype(np.float32, copy=False)\n",
    "\n",
    "X_all = np.asarray(X_scaled, dtype=np.float32, order=\"C\")\n",
    "y_all = np.asarray(y, dtype=np.int64)\n",
    "\n",
    "print(f\"[DATA] {DATA_FILE} | X={X_all.shape} | C={NUM_CLASSES} | map={class_map}\")\n",
    "print(\"[GPU ] cuda=\", torch.cuda.is_available(), \"| visible_gpus=\", torch.cuda.device_count())\n",
    "\n",
    "# 5x5 CV\n",
    "rkf = RepeatedStratifiedKFold(n_splits=5, n_repeats=5, random_state=SEED)\n",
    "\n",
    "# Devices\n",
    "NSC_DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
    "TABPFN_DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
    "\n",
    "# -----------------------\n",
    "# Optuna objective\n",
    "# -----------------------\n",
    "def objective(trial: optuna.Trial):\n",
    "    seed_everything(SEED)\n",
    "\n",
    "    # --------- Tune GO-LR (once per trial) ----------\n",
    "    go_metric = trial.suggest_categorical(\n",
    "        \"go_metric\", [\"correlation\", \"cosine\", \"manhattan\", \"euclidean\", \"kl_divergence\"]\n",
    "    )\n",
    "    go_k = trial.suggest_int(\"go_num_clusters\", 4, 12)\n",
    "    go_refine_passes = trial.suggest_int(\"go_refine_passes\", 1, 3)\n",
    "    go_direction = trial.suggest_categorical(\"go_direction_select\", [True, False])\n",
    "\n",
    "    \n",
    "    # We try use_cpu_kmeans=False first, then fallback True if needed.\n",
    "\n",
    "    # --------- Tune NSC ----------\n",
    "    nsc_seg = trial.suggest_categorical(\"nsc_segmentation\", [\"uniform\", \"largest_jump\", \"equal_mass\"])\n",
    "    nsc_m_rule = trial.suggest_categorical(\"nsc_m_rule\", [\"default\", \"idf\", \"gamma\"])\n",
    "    nsc_tau = trial.suggest_categorical(\"nsc_tau\", [0.95, 0.99, 0.9975])\n",
    "    nsc_gamma = trial.suggest_float(\"nsc_gamma\", 1.0, 3.0)\n",
    "    nsc_beta = trial.suggest_float(\"nsc_beta\", 0.0, 0.9)\n",
    "    nsc_Mmin = trial.suggest_categorical(\"nsc_Mmin\", [16, 32, 48, 64])\n",
    "    nsc_Mmax = trial.suggest_categorical(\"nsc_Mmax\", [128, 256, 384, 512, 640])\n",
    "    nsc_lmin = trial.suggest_categorical(\"nsc_lmin\", [8, 12, 16])\n",
    "    assume_standardized = trial.suggest_categorical(\"assume_standardized\", [True, False])\n",
    "\n",
    "    # TabPFN seed (head is frozen; but its internal rng can matter)\n",
    "    tabpfn_seed = trial.suggest_categorical(\"tabpfn_seed\", [0, 1, 2, 3, 4, 42])\n",
    "\n",
    "    # ---- GO-LR ONCE per trial ----\n",
    "    go = GraphFeatureOrdering(\n",
    "        num_clusters=int(go_k),\n",
    "        metric=go_metric,\n",
    "        refine=True,\n",
    "        direction_select=bool(go_direction),\n",
    "        refine_passes=int(go_refine_passes),\n",
    "    )\n",
    "\n",
    "    try:\n",
    "        # Prefer GPU kmeans\n",
    "        Pi_star, _, _, _ = go.fit(X_all, seed=SEED, deterministic=True, use_cpu_kmeans=False)\n",
    "    except RuntimeError as e:\n",
    "        # Fallback to CPU kmeans if GPU path OOMs/fails\n",
    "        cleanup_cuda()\n",
    "        try:\n",
    "            Pi_star, _, _, _ = go.fit(X_all, seed=SEED, deterministic=True, use_cpu_kmeans=True)\n",
    "        except Exception:\n",
    "            raise optuna.TrialPruned(f\"GO-LR failed (metric={go_metric})\")\n",
    "\n",
    "    # ---- 5x5 CV: NSC+TabPFN per fold using fixed Pi_star ----\n",
    "    head_cfg = TabPFN25Config(\n",
    "        task_type=\"binary\",\n",
    "        num_classes=int(NUM_CLASSES),\n",
    "        device=TABPFN_DEVICE,\n",
    "        random_state=int(tabpfn_seed),\n",
    "    )\n",
    "\n",
    "    accs = []\n",
    "    for fold_id, (tr_idx, va_idx) in enumerate(rkf.split(X_all, y_all), start=1):\n",
    "        X_tr = X_all[tr_idx]\n",
    "        y_tr = y_all[tr_idx]\n",
    "        X_va = X_all[va_idx]\n",
    "        y_va = y_all[va_idx]\n",
    "\n",
    "        # NSC config on TRAIN only\n",
    "        nsc = PIDFSegPCA(\n",
    "            segmentation=nsc_seg,\n",
    "            l_min=int(nsc_lmin),\n",
    "            m_rule=nsc_m_rule,\n",
    "            gamma=float(nsc_gamma),\n",
    "            beta=float(nsc_beta),\n",
    "            tau=float(nsc_tau),\n",
    "            M_min=int(nsc_Mmin),\n",
    "            M_max=int(nsc_Mmax),\n",
    "            assume_standardized=bool(assume_standardized),\n",
    "            device=NSC_DEVICE,\n",
    "        )\n",
    "\n",
    "        deltas = None if nsc_seg == \"uniform\" else compute_deltas_adjacent_corr(X_tr, Pi_star)\n",
    "\n",
    "        X_tr_t = torch.from_numpy(X_tr)\n",
    "        nsc.configure(Pi_star=Pi_star, X_train=X_tr_t, tau=float(nsc_tau), deltas=deltas)\n",
    "\n",
    "        Z_tr = nsc.compress(X_tr_t, mode=\"flatten\").cpu().numpy()\n",
    "        Z_va = nsc.compress(torch.from_numpy(X_va), mode=\"flatten\").cpu().numpy()\n",
    "\n",
    "        # TabPFN fit/eval\n",
    "        head = TabPFN25Head(head_cfg)\n",
    "        head.fit(Z_tr, y_tr)\n",
    "\n",
    "        P = head.predict_proba(Z_va)\n",
    "        pred = np.argmax(P, axis=1)\n",
    "        acc = float(accuracy_score(y_va, pred))\n",
    "        accs.append(acc)\n",
    "\n",
    "        # prune on running mean\n",
    "        trial.report(float(np.mean(accs)), step=fold_id)\n",
    "        if trial.should_prune():\n",
    "            cleanup_cuda()\n",
    "            raise optuna.TrialPruned()\n",
    "\n",
    "        cleanup_cuda()\n",
    "\n",
    "    mean_acc = float(np.mean(accs))\n",
    "    std_acc  = float(np.std(accs, ddof=1))\n",
    "    trial.set_user_attr(\"mean_acc\", mean_acc)\n",
    "    trial.set_user_attr(\"std_acc\", std_acc)\n",
    "    return mean_acc\n",
    "\n",
    "# -----------------------\n",
    "# Run Optuna\n",
    "# -----------------------\n",
    "sampler = optuna.samplers.TPESampler(seed=SEED, multivariate=True, group=True)\n",
    "pruner  = optuna.pruners.MedianPruner(n_warmup_steps=10)  # warmup because 25 folds\n",
    "\n",
    "study = optuna.create_study(direction=\"maximize\", sampler=sampler, pruner=pruner)\n",
    "study.optimize(objective, n_trials=N_TRIALS, show_progress_bar=True, gc_after_trial=True, n_jobs=1)\n",
    "\n",
    "best = study.best_trial\n",
    "print(\"\\n================ BEST TRIAL ================\")\n",
    "print(f\"mean_acc ± std_acc = {best.user_attrs.get('mean_acc', best.value):.6f} ± {best.user_attrs.get('std_acc', float('nan')):.6f}\")\n",
    "print(\"\\nBest hyperparameters:\")\n",
    "for k, v in best.params.items():\n",
    "    print(f\"  {k}: {v}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9a4fb0ee-8e3a-4375-8197-76f07fe2e56f",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
