{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "766d736f-01c4-4fa5-b6d6-e90fff890b20",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[I 2026-01-21 20:08:17,456] A new study created in memory with name: no-name-5d6d71fa-de0b-46d6-a0fb-0e3d0033fc0a\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[DATA] TOX171_combined_encoded.csv | X=(171, 5748) | C=4 | map={0: 0, 1: 1, 2: 2, 3: 3}\n",
      "[GPU ] cuda= True | visible_gpus= 8\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "60db10293b3641ae9dcf7d121741af49",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/150 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[I 2026-01-21 20:10:09,797] Trial 0 finished with value: 0.8947226890756304 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.8638900372842315, 'nsc_beta': 0.26210622617823776, 'nsc_Mmin': 16, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:12:08,702] Trial 1 finished with value: 0.8550924369747898 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 9, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 1.0904545778210761, 'nsc_beta': 0.2927972976869379, 'nsc_Mmin': 48, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:14:33,552] Trial 2 finished with value: 0.8115294117647057 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.0508382534881904, 'nsc_beta': 0.09710228429397401, 'nsc_Mmin': 32, 'nsc_Mmax': 128, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:17:23,051] Trial 3 finished with value: 0.8139831932773108 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 1.727259204758588, 'nsc_beta': 0.8746038744488647, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:20:08,272] Trial 4 finished with value: 0.8770756302521009 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 11, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.873459977473469, 'nsc_beta': 0.12376884973139393, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:22:04,428] Trial 5 finished with value: 0.8926050420168068 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.2992657980944293, 'nsc_beta': 0.7643010694447602, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:25:00,137] Trial 6 finished with value: 0.7964369747899158 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 12, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.14012234017873, 'nsc_beta': 0.08745884439369168, 'nsc_Mmin': 32, 'nsc_Mmax': 128, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:26:11,205] Trial 7 pruned. \n",
      "[I 2026-01-21 20:28:15,049] Trial 8 pruned. \n",
      "[I 2026-01-21 20:31:07,734] Trial 9 finished with value: 0.8420504201680673 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.6289369651778713, 'nsc_beta': 0.25366929729605997, 'nsc_Mmin': 64, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 1}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:33:08,121] Trial 10 finished with value: 0.8149915966386555 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 2.0934366930214616, 'nsc_beta': 0.48937648530829453, 'nsc_Mmin': 16, 'nsc_Mmax': 128, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:34:12,478] Trial 11 pruned. \n",
      "[I 2026-01-21 20:36:15,779] Trial 12 finished with value: 0.8653781512605042 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.766038341146983, 'nsc_beta': 0.09408561823503278, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 0 with value: 0.8947226890756304.\n",
      "[I 2026-01-21 20:38:28,426] Trial 13 finished with value: 0.9029915966386555 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.7176471805162494, 'nsc_beta': 0.6746391325074964, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 13 with value: 0.9029915966386555.\n",
      "[I 2026-01-21 20:40:57,407] Trial 14 finished with value: 0.8654117647058824 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.844727413168471, 'nsc_beta': 0.7767038516175356, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 13 with value: 0.9029915966386555.\n",
      "[I 2026-01-21 20:41:47,303] Trial 15 pruned. \n",
      "[I 2026-01-21 20:43:48,793] Trial 16 finished with value: 0.8641680672268905 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 1.8107082910184444, 'nsc_beta': 0.11198783224673176, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 13 with value: 0.9029915966386555.\n",
      "[I 2026-01-21 20:45:28,923] Trial 17 pruned. \n",
      "[I 2026-01-21 20:46:42,073] Trial 18 pruned. \n",
      "[I 2026-01-21 20:49:31,429] Trial 19 finished with value: 0.8818823529411765 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 10, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.7546623214033623, 'nsc_beta': 0.4129891454579623, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 13 with value: 0.9029915966386555.\n",
      "[I 2026-01-21 20:50:58,216] Trial 20 pruned. \n",
      "[I 2026-01-21 20:53:13,300] Trial 21 finished with value: 0.878453781512605 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.538543937969017, 'nsc_beta': 0.5318047089197158, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 13 with value: 0.9029915966386555.\n",
      "[I 2026-01-21 20:55:21,841] Trial 22 finished with value: 0.8713277310924369 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'idf', 'nsc_tau': 0.95, 'nsc_gamma': 1.7905305019396747, 'nsc_beta': 0.8409826805723346, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 13 with value: 0.9029915966386555.\n",
      "[I 2026-01-21 20:57:21,934] Trial 23 finished with value: 0.9078319327731093 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.673812126339601, 'nsc_beta': 0.6220534070552344, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 20:59:29,031] Trial 24 finished with value: 0.8923025210084033 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.577743936783575, 'nsc_beta': 0.479102221397426, 'nsc_Mmin': 48, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:01:46,000] Trial 25 finished with value: 0.8959327731092437 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.4297574122631476, 'nsc_beta': 0.7253037400108616, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:03:51,877] Trial 26 finished with value: 0.9005378151260505 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.602516506499876, 'nsc_beta': 0.7044386920681273, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:04:50,565] Trial 27 pruned. \n",
      "[I 2026-01-21 21:06:38,956] Trial 28 finished with value: 0.8783193277310924 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.5780971010501417, 'nsc_beta': 0.5345506716056239, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:07:32,617] Trial 29 pruned. \n",
      "[I 2026-01-21 21:09:35,997] Trial 30 finished with value: 0.862890756302521 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.46851902245609, 'nsc_beta': 0.44503782265417713, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:11:04,066] Trial 31 pruned. \n",
      "[I 2026-01-21 21:12:03,200] Trial 32 pruned. \n",
      "[I 2026-01-21 21:14:27,012] Trial 33 finished with value: 0.8887058823529412 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.9888967120583256, 'nsc_beta': 0.7050557284336738, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:17:17,463] Trial 34 finished with value: 0.8915294117647059 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 12, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.5318697404308854, 'nsc_beta': 0.825470643310148, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:18:55,700] Trial 35 finished with value: 0.8595966386554622 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.675944090791732, 'nsc_beta': 0.7957734524856026, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:21:02,260] Trial 36 finished with value: 0.8890420168067226 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.1396431093965718, 'nsc_beta': 0.6523681720730572, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:21:56,218] Trial 37 pruned. \n",
      "[I 2026-01-21 21:23:47,790] Trial 38 finished with value: 0.9006050420168067 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.907633859499004, 'nsc_beta': 0.7375719278254462, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:25:35,027] Trial 39 finished with value: 0.892436974789916 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.8356853366206147, 'nsc_beta': 0.776718403296924, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:27:19,967] Trial 40 finished with value: 0.8969747899159662 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.7499685008760593, 'nsc_beta': 0.682713573955733, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:29:27,776] Trial 41 finished with value: 0.8632605042016808 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.321553249601247, 'nsc_beta': 0.6921647025648601, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:31:13,393] Trial 42 finished with value: 0.8922689075630252 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.790552748957567, 'nsc_beta': 0.8857137485689016, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:31:55,836] Trial 43 pruned. \n",
      "[I 2026-01-21 21:33:24,603] Trial 44 finished with value: 0.858252100840336 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.6721329266789997, 'nsc_beta': 0.698810755555912, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:34:11,230] Trial 45 pruned. \n",
      "[I 2026-01-21 21:35:59,528] Trial 46 finished with value: 0.8992605042016806 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7410881951966215, 'nsc_beta': 0.746067805714952, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:37:48,340] Trial 47 finished with value: 0.9027226890756301 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4824149689947173, 'nsc_beta': 0.8858318608053313, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:39:32,218] Trial 48 finished with value: 0.8982184873949579 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 9, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7350228228998166, 'nsc_beta': 0.8813960293250722, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:40:13,595] Trial 49 pruned. \n",
      "[I 2026-01-21 21:41:26,637] Trial 50 finished with value: 0.8547899159663865 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.7933759120940542, 'nsc_beta': 0.4284184889088658, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:42:42,350] Trial 51 pruned. \n",
      "[I 2026-01-21 21:45:02,811] Trial 52 finished with value: 0.907764705882353 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7969571722757185, 'nsc_beta': 0.8941096785349187, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 23 with value: 0.9078319327731093.\n",
      "[I 2026-01-21 21:47:40,787] Trial 53 finished with value: 0.9332773109243697 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.855967165618566, 'nsc_beta': 0.6509255216337713, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 21:50:09,971] Trial 54 finished with value: 0.8678655462184873 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 11, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.714523619186744, 'nsc_beta': 0.8044237439767324, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 21:51:38,396] Trial 55 pruned. \n",
      "[I 2026-01-21 21:53:02,552] Trial 56 pruned. \n",
      "[I 2026-01-21 21:54:56,006] Trial 57 finished with value: 0.9017478991596637 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.704239984153966, 'nsc_beta': 0.6095120936535545, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 21:57:04,796] Trial 58 finished with value: 0.8760672268907561 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 8, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7107654808206423, 'nsc_beta': 0.5798819868972421, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 21:58:43,461] Trial 59 finished with value: 0.8805714285714284 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.3259894074851877, 'nsc_beta': 0.8445035499620709, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:00:14,003] Trial 60 pruned. \n",
      "[I 2026-01-21 22:02:35,062] Trial 61 finished with value: 0.8652436974789914 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 10, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.8880712484083424, 'nsc_beta': 0.4302102191967355, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:04:44,380] Trial 62 finished with value: 0.874689075630252 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.4000513109002073, 'nsc_beta': 0.7399380069544517, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:06:23,187] Trial 63 pruned. \n",
      "[I 2026-01-21 22:08:01,596] Trial 64 finished with value: 0.8745882352941176 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 9, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.550067905408057, 'nsc_beta': 0.7911873209967175, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:10:37,193] Trial 65 finished with value: 0.9017478991596637 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.313482532346338, 'nsc_beta': 0.5873540412799727, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:13:41,244] Trial 66 finished with value: 0.8984201680672268 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.4942361046816437, 'nsc_beta': 0.36634572322050085, 'nsc_Mmin': 48, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:15:44,526] Trial 67 pruned. \n",
      "[I 2026-01-21 22:17:48,418] Trial 68 pruned. \n",
      "[I 2026-01-21 22:19:37,013] Trial 69 finished with value: 0.8774453781512603 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.231621108782672, 'nsc_beta': 0.7143476063929766, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:22:41,527] Trial 70 finished with value: 0.8806050420168067 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 3, 'go_direction_select': False, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4480862273488677, 'nsc_beta': 0.4952112775502535, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:24:55,246] Trial 71 finished with value: 0.8889411764705882 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4937783762823766, 'nsc_beta': 0.8650461597507765, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 1}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:27:34,169] Trial 72 finished with value: 0.8901512605042017 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 12, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7071123462077322, 'nsc_beta': 0.46725666078878114, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:29:26,645] Trial 73 finished with value: 0.8737478991596638 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.8256487763982436, 'nsc_beta': 0.5739410998043963, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:31:10,477] Trial 74 pruned. \n",
      "[I 2026-01-21 22:33:30,898] Trial 75 finished with value: 0.9135126050420166 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.6014974580071883, 'nsc_beta': 0.8355047589939268, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:35:52,045] Trial 76 finished with value: 0.9031260504201681 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4399084756000886, 'nsc_beta': 0.8579198089435871, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:38:25,141] Trial 77 finished with value: 0.8643025210084032 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'idf', 'nsc_tau': 0.99, 'nsc_gamma': 2.8829157068650715, 'nsc_beta': 0.8450284829670339, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:39:58,661] Trial 78 pruned. \n",
      "[I 2026-01-21 22:42:09,333] Trial 79 finished with value: 0.8960672268907564 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.387470068916868, 'nsc_beta': 0.7851582945587211, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 1}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:44:33,946] Trial 80 pruned. \n",
      "[I 2026-01-21 22:46:37,671] Trial 81 pruned. \n",
      "[I 2026-01-21 22:48:28,617] Trial 82 pruned. \n",
      "[I 2026-01-21 22:51:09,380] Trial 83 finished with value: 0.8933781512605043 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 10, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7479034301825433, 'nsc_beta': 0.7849930093385542, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 1}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:54:17,460] Trial 84 finished with value: 0.8808067226890757 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.95, 'nsc_gamma': 2.5426874388494056, 'nsc_beta': 0.6883764109109172, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 22:58:19,805] Trial 85 finished with value: 0.8865210084033612 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 11, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.901178371622854, 'nsc_beta': 0.844052512395602, 'nsc_Mmin': 64, 'nsc_Mmax': 512, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:02:14,015] Trial 86 finished with value: 0.8875630252100839 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.5321587763441706, 'nsc_beta': 0.6297373515022197, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:04:58,405] Trial 87 finished with value: 0.8831596638655462 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.7631844346661154, 'nsc_beta': 0.2506467086593754, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:08:43,314] Trial 88 finished with value: 0.905109243697479 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.3198398907595785, 'nsc_beta': 0.7536757853702656, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:12:41,331] Trial 89 finished with value: 0.904033613445378 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4120427962412836, 'nsc_beta': 0.7117047215533013, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:15:42,816] Trial 90 finished with value: 0.9029243697478992 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.9519502563404765, 'nsc_beta': 0.6148326534820208, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:18:38,416] Trial 91 finished with value: 0.87381512605042 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.80775997311507, 'nsc_beta': 0.5458567611740739, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:21:52,544] Trial 92 finished with value: 0.885378151260504 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 1.8721109297293983, 'nsc_beta': 0.6576605854946567, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:25:52,887] Trial 93 finished with value: 0.8102857142857143 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 10, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.0997936190622193, 'nsc_beta': 0.7410641231216967, 'nsc_Mmin': 32, 'nsc_Mmax': 128, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:30:09,062] Trial 94 finished with value: 0.8772773109243698 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.99, 'nsc_gamma': 2.89556268540793, 'nsc_beta': 0.3986643695821348, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:32:43,678] Trial 95 pruned. \n",
      "[I 2026-01-21 23:36:59,348] Trial 96 finished with value: 0.9099159663865545 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7626549940789342, 'nsc_beta': 0.8153480253771904, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:40:57,528] Trial 97 finished with value: 0.9123025210084034 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.5456459006626693, 'nsc_beta': 0.6698334305633025, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:44:00,155] Trial 98 pruned. \n",
      "[I 2026-01-21 23:47:37,211] Trial 99 finished with value: 0.8959663865546217 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.947717282644076, 'nsc_beta': 0.5815770545722658, 'nsc_Mmin': 32, 'nsc_Mmax': 512, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:50:24,566] Trial 100 pruned. \n",
      "[I 2026-01-21 23:53:37,929] Trial 101 pruned. \n",
      "[I 2026-01-21 23:57:26,753] Trial 102 finished with value: 0.8782857142857142 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.370737684119908, 'nsc_beta': 0.8964488794503515, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-21 23:59:43,132] Trial 103 pruned. \n",
      "[I 2026-01-22 00:03:47,309] Trial 104 finished with value: 0.8898823529411765 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.3818465446847172, 'nsc_beta': 0.8534395078700733, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:06:40,811] Trial 105 pruned. \n",
      "[I 2026-01-22 00:09:55,886] Trial 106 finished with value: 0.8819159663865546 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.762065238568275, 'nsc_beta': 0.7800288259840389, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 8, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:11:37,184] Trial 107 pruned. \n",
      "[I 2026-01-22 00:14:15,127] Trial 108 finished with value: 0.8890084033613445 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.274704457519279, 'nsc_beta': 0.5214631429734062, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:17:01,554] Trial 109 pruned. \n",
      "[I 2026-01-22 00:21:16,001] Trial 110 finished with value: 0.8854117647058825 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.0229465065415333, 'nsc_beta': 0.6136009777607894, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 3}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:23:42,715] Trial 111 finished with value: 0.8934789915966387 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.744707728929166, 'nsc_beta': 0.6781754648737617, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:27:34,525] Trial 112 finished with value: 0.8785210084033613 and parameters: {'go_metric': 'correlation', 'go_num_clusters': 11, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.6078494936882732, 'nsc_beta': 0.46679906783944586, 'nsc_Mmin': 64, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:32:13,640] Trial 113 finished with value: 0.9054117647058824 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 10, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.656093720702383, 'nsc_beta': 0.7455255161169736, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 3}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:36:01,206] Trial 114 pruned. \n",
      "[I 2026-01-22 00:40:55,725] Trial 115 finished with value: 0.8621176470588234 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 11, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.721505702532294, 'nsc_beta': 0.7148846961716037, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:43:37,152] Trial 116 finished with value: 0.8769411764705882 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.755294426022555, 'nsc_beta': 0.6901693872681108, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:47:06,895] Trial 117 finished with value: 0.8842352941176469 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.95, 'nsc_gamma': 2.336038389760235, 'nsc_beta': 0.7149202544924009, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:50:41,090] Trial 118 finished with value: 0.8994957983193278 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 8, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.1566144101967533, 'nsc_beta': 0.8584690515011951, 'nsc_Mmin': 64, 'nsc_Mmax': 640, 'nsc_lmin': 12, 'assume_standardized': True, 'tabpfn_seed': 0}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:53:25,844] Trial 119 finished with value: 0.8665210084033613 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': False, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.593677607268083, 'nsc_beta': 0.516887627105026, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 00:56:37,035] Trial 120 pruned. \n",
      "[I 2026-01-22 00:59:13,240] Trial 121 finished with value: 0.8829915966386556 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'default', 'nsc_tau': 0.9975, 'nsc_gamma': 2.9499293765202004, 'nsc_beta': 0.6721385276648555, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:02:59,835] Trial 122 finished with value: 0.9086050420168067 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.6943863165145667, 'nsc_beta': 0.7098299202011413, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:06:50,548] Trial 123 finished with value: 0.9027899159663865 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.5601094353737164, 'nsc_beta': 0.4888396885203854, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:08:27,126] Trial 124 pruned. \n",
      "[I 2026-01-22 01:11:19,046] Trial 125 finished with value: 0.8995630252100839 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 4, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.257141573632588, 'nsc_beta': 0.36118747865265977, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:14:57,604] Trial 126 pruned. \n",
      "[I 2026-01-22 01:18:53,963] Trial 127 pruned. \n",
      "[I 2026-01-22 01:22:10,914] Trial 128 finished with value: 0.8596974789915964 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'idf', 'nsc_tau': 0.9975, 'nsc_gamma': 2.436002765464894, 'nsc_beta': 0.6620903153405385, 'nsc_Mmin': 32, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:24:21,935] Trial 129 pruned. \n",
      "[I 2026-01-22 01:25:33,249] Trial 130 pruned. \n",
      "[I 2026-01-22 01:28:35,923] Trial 131 finished with value: 0.8912941176470587 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.03145512114067, 'nsc_beta': 0.49217421192958977, 'nsc_Mmin': 16, 'nsc_Mmax': 384, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:29:44,681] Trial 132 pruned. \n",
      "[I 2026-01-22 01:33:26,751] Trial 133 finished with value: 0.8980840336134454 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 7, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.9213061139088654, 'nsc_beta': 0.8686114683510391, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:37:11,743] Trial 134 finished with value: 0.9029915966386554 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.991432703465412, 'nsc_beta': 0.6211993464515677, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:42:04,215] Trial 135 finished with value: 0.8888739495798319 and parameters: {'go_metric': 'manhattan', 'go_num_clusters': 9, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.696804146020127, 'nsc_beta': 0.8122336841003861, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:46:23,241] Trial 136 finished with value: 0.8665882352941177 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 9, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.911431289622103, 'nsc_beta': 0.7695266033936973, 'nsc_Mmin': 48, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:49:27,726] Trial 137 finished with value: 0.8781848739495797 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.334690391704952, 'nsc_beta': 0.7151618004184955, 'nsc_Mmin': 32, 'nsc_Mmax': 384, 'nsc_lmin': 8, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:52:29,085] Trial 138 pruned. \n",
      "[I 2026-01-22 01:56:50,042] Trial 139 finished with value: 0.8233277310924368 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 10, 'go_refine_passes': 2, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.4067648813515694, 'nsc_beta': 0.7277485645697168, 'nsc_Mmin': 32, 'nsc_Mmax': 256, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 4}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 01:59:47,935] Trial 140 finished with value: 0.9087731092436975 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 7, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.540522306641088, 'nsc_beta': 0.7055126593717237, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 02:03:17,488] Trial 141 finished with value: 0.8747899159663863 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 6, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'largest_jump', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.9637792985498153, 'nsc_beta': 0.5269133795686786, 'nsc_Mmin': 48, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': True, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 02:05:10,501] Trial 142 pruned. \n",
      "[I 2026-01-22 02:07:43,301] Trial 143 finished with value: 0.8782184873949578 and parameters: {'go_metric': 'cosine', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.9216339913602796, 'nsc_beta': 0.6353637678157174, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 1}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 02:09:18,190] Trial 144 pruned. \n",
      "[I 2026-01-22 02:11:01,416] Trial 145 pruned. \n",
      "[I 2026-01-22 02:13:53,998] Trial 146 pruned. \n",
      "[I 2026-01-22 02:16:40,012] Trial 147 finished with value: 0.8877647058823528 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 5, 'go_refine_passes': 2, 'go_direction_select': False, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.176458720686559, 'nsc_beta': 0.7391173784283075, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 42}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 02:19:04,317] Trial 148 finished with value: 0.898218487394958 and parameters: {'go_metric': 'euclidean', 'go_num_clusters': 6, 'go_refine_passes': 1, 'go_direction_select': True, 'nsc_segmentation': 'uniform', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.9975, 'nsc_gamma': 2.3513599163478314, 'nsc_beta': 0.5608000373243313, 'nsc_Mmin': 48, 'nsc_Mmax': 384, 'nsc_lmin': 12, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "[I 2026-01-22 02:22:13,733] Trial 149 finished with value: 0.8959327731092437 and parameters: {'go_metric': 'kl_divergence', 'go_num_clusters': 5, 'go_refine_passes': 3, 'go_direction_select': True, 'nsc_segmentation': 'equal_mass', 'nsc_m_rule': 'gamma', 'nsc_tau': 0.99, 'nsc_gamma': 2.7032388086601826, 'nsc_beta': 0.8227108356249737, 'nsc_Mmin': 16, 'nsc_Mmax': 640, 'nsc_lmin': 16, 'assume_standardized': False, 'tabpfn_seed': 2}. Best is trial 53 with value: 0.9332773109243697.\n",
      "\n",
      "================ BEST TRIAL ================\n",
      "mean_acc ± std_acc = 0.933277 ± 0.047434\n",
      "\n",
      "Best hyperparameters:\n",
      "  go_metric: kl_divergence\n",
      "  go_num_clusters: 10\n",
      "  go_refine_passes: 3\n",
      "  go_direction_select: True\n",
      "  nsc_segmentation: equal_mass\n",
      "  nsc_m_rule: gamma\n",
      "  nsc_tau: 0.99\n",
      "  nsc_gamma: 2.855967165618566\n",
      "  nsc_beta: 0.6509255216337713\n",
      "  nsc_Mmin: 32\n",
      "  nsc_Mmax: 384\n",
      "  nsc_lmin: 16\n",
      "  assume_standardized: False\n",
      "  tabpfn_seed: 4\n"
     ]
    }
   ],
   "source": [
    "# ============================================================\n",
    "# ONE CELL (TOX171, multiclass): OPTUNA with GO-LR ONCE per trial \n",
    "# Per trial:\n",
    "#   1) GO-LR fit on FULL X -> Pi_star (fixed for all folds in that trial)\n",
    "#   2) 5x5 CV folds:\n",
    "#        NSC configure on train only (uses fixed Pi_star)\n",
    "#        compress train/val\n",
    "#        TabPFN fit on train, eval on val\n",
    "# ============================================================\n",
    "\n",
    "import os, sys, gc, random, warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "\n",
    "os.environ.setdefault(\"PYTORCH_CUDA_ALLOC_CONF\", \"expandable_segments:True\")\n",
    "os.environ.setdefault(\"CUDA_DEVICE_ORDER\", \"PCI_BUS_ID\")\n",
    "\n",
    "import optuna\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import torch\n",
    "\n",
    "from sklearn.model_selection import RepeatedStratifiedKFold\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "from sklearn.metrics import accuracy_score\n",
    "from tqdm import tqdm\n",
    "\n",
    "#   GraphFeatureOrdering, pidf_segpca, TabPFN25Head, TabPFN25Config\n",
    "from gotabpfn import GraphFeatureOrdering, pidf_segpca, TabPFN25Head, TabPFN25Config\n",
    "PIDFSegPCA = pidf_segpca  # alias to match your earlier naming\n",
    "\n",
    "# -----------------------\n",
    "# Config\n",
    "# -----------------------\n",
    "SEED = 42\n",
    "DATA_FILE  = \"TOX171_combined_encoded.csv\"\n",
    "TARGET_COL = \"Label\"\n",
    "\n",
    "N_TRIALS = 150\n",
    "GPU_ID = 7  # change if needed\n",
    "\n",
    "# If you want to force which GPU is visible for kmeans_gpu + tabpfn:\n",
    "if \"torch\" not in sys.modules:\n",
    "    os.environ[\"CUDA_VISIBLE_DEVICES\"] = str(GPU_ID)\n",
    "\n",
    "# -----------------------\n",
    "# Utils\n",
    "# -----------------------\n",
    "def seed_everything(seed: int = 42):\n",
    "    random.seed(seed)\n",
    "    np.random.seed(seed)\n",
    "    torch.manual_seed(seed)\n",
    "    if torch.cuda.is_available():\n",
    "        torch.cuda.manual_seed_all(seed)\n",
    "    os.environ[\"PYTHONHASHSEED\"] = str(seed)\n",
    "\n",
    "def cleanup_cuda():\n",
    "    gc.collect()\n",
    "    if torch.cuda.is_available():\n",
    "        try:\n",
    "            torch.cuda.synchronize()\n",
    "        except Exception:\n",
    "            pass\n",
    "        torch.cuda.empty_cache()\n",
    "\n",
    "def ensure_multiclass_contiguous(y: np.ndarray):\n",
    "    y = np.asarray(y).reshape(-1)\n",
    "    uniq = np.unique(y)\n",
    "    uniq_sorted = np.sort(uniq)\n",
    "    class_map = {orig: i for i, orig in enumerate(uniq_sorted.tolist())}\n",
    "    y_enc = np.vectorize(class_map.get, otypes=[np.int64])(y).astype(np.int64)\n",
    "    return y_enc, class_map, int(len(class_map))\n",
    "\n",
    "def compute_deltas_adjacent_corr(X_tr: np.ndarray, Pi_star: list[int], eps: float = 1e-12) -> torch.Tensor:\n",
    "    \"\"\"\n",
    "    delta[t] = 1 - |corr(feature_{Pi[t]}, feature_{Pi[t+1]})|\n",
    "    Returns torch.Tensor shape (m-1,) on CPU.\n",
    "    \"\"\"\n",
    "    X = torch.from_numpy(X_tr).float()  # CPU\n",
    "    perm = torch.tensor(Pi_star, dtype=torch.long)\n",
    "    Xp = X[:, perm]\n",
    "    Xc = Xp - Xp.mean(dim=0, keepdim=True)\n",
    "    std = Xc.std(dim=0, unbiased=False, keepdim=True).clamp_min(eps)\n",
    "    Z = Xc / std\n",
    "    corr = (Z[:, :-1] * Z[:, 1:]).mean(dim=0)\n",
    "    return (1.0 - corr.abs()).cpu()\n",
    "\n",
    "# -----------------------\n",
    "# Load data\n",
    "# -----------------------\n",
    "seed_everything(SEED)\n",
    "df = pd.read_csv(DATA_FILE)\n",
    "\n",
    "y_raw = df[TARGET_COL].to_numpy()\n",
    "X_df  = df.drop(columns=[TARGET_COL])\n",
    "\n",
    "y, class_map, NUM_CLASSES = ensure_multiclass_contiguous(y_raw)\n",
    "\n",
    "# Standardize globally (leakage OK in your workflow)\n",
    "scaler = StandardScaler()\n",
    "X_scaled = scaler.fit_transform(X_df.values).astype(np.float32, copy=False)\n",
    "\n",
    "X_all = np.asarray(X_scaled, dtype=np.float32, order=\"C\")\n",
    "y_all = np.asarray(y, dtype=np.int64)\n",
    "\n",
    "print(f\"[DATA] {DATA_FILE} | X={X_all.shape} | C={NUM_CLASSES} | map={class_map}\")\n",
    "print(\"[GPU ] cuda=\", torch.cuda.is_available(), \"| visible_gpus=\", torch.cuda.device_count())\n",
    "\n",
    "# 5x5 CV\n",
    "rkf = RepeatedStratifiedKFold(n_splits=5, n_repeats=5, random_state=SEED)\n",
    "\n",
    "# Devices\n",
    "NSC_DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
    "TABPFN_DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
    "\n",
    "# -----------------------\n",
    "# Optuna objective\n",
    "# -----------------------\n",
    "def objective(trial: optuna.Trial):\n",
    "    seed_everything(SEED)\n",
    "\n",
    "    # --------- Tune GO-LR (once per trial) ----------\n",
    "    go_metric = trial.suggest_categorical(\n",
    "        \"go_metric\", [\"correlation\", \"cosine\", \"manhattan\", \"euclidean\", \"kl_divergence\"]\n",
    "    )\n",
    "    go_k = trial.suggest_int(\"go_num_clusters\", 4, 12)\n",
    "    go_refine_passes = trial.suggest_int(\"go_refine_passes\", 1, 3)\n",
    "    go_direction = trial.suggest_categorical(\"go_direction_select\", [True, False])\n",
    "\n",
    "    # IMPORTANT: prefer GPU KMeans first; CPU only as fallback\n",
    "    # So we DO NOT tune go_use_cpu_kmeans here.\n",
    "    # We try use_cpu_kmeans=False first, then fallback True if needed.\n",
    "\n",
    "    # --------- Tune NSC ----------\n",
    "    nsc_seg = trial.suggest_categorical(\"nsc_segmentation\", [\"uniform\", \"largest_jump\", \"equal_mass\"])\n",
    "    nsc_m_rule = trial.suggest_categorical(\"nsc_m_rule\", [\"default\", \"idf\", \"gamma\"])\n",
    "    nsc_tau = trial.suggest_categorical(\"nsc_tau\", [0.95, 0.99, 0.9975])\n",
    "    nsc_gamma = trial.suggest_float(\"nsc_gamma\", 1.0, 3.0)\n",
    "    nsc_beta = trial.suggest_float(\"nsc_beta\", 0.0, 0.9)\n",
    "    nsc_Mmin = trial.suggest_categorical(\"nsc_Mmin\", [16, 32, 48, 64])\n",
    "    nsc_Mmax = trial.suggest_categorical(\"nsc_Mmax\", [128, 256, 384, 512, 640])\n",
    "    nsc_lmin = trial.suggest_categorical(\"nsc_lmin\", [8, 12, 16])\n",
    "    assume_standardized = trial.suggest_categorical(\"assume_standardized\", [True, False])\n",
    "\n",
    "    # TabPFN seed (head is frozen; but its internal rng can matter)\n",
    "    tabpfn_seed = trial.suggest_categorical(\"tabpfn_seed\", [0, 1, 2, 3, 4, 42])\n",
    "\n",
    "    # ---- GO-LR ONCE per trial ----\n",
    "    go = GraphFeatureOrdering(\n",
    "        num_clusters=int(go_k),\n",
    "        metric=go_metric,\n",
    "        refine=True,\n",
    "        direction_select=bool(go_direction),\n",
    "        refine_passes=int(go_refine_passes),\n",
    "    )\n",
    "\n",
    "    try:\n",
    "        # Prefer GPU kmeans\n",
    "        Pi_star, _, _, _ = go.fit(X_all, seed=SEED, deterministic=True, use_cpu_kmeans=False)\n",
    "    except RuntimeError as e:\n",
    "        # Fallback to CPU kmeans if GPU path OOMs/fails\n",
    "        cleanup_cuda()\n",
    "        try:\n",
    "            Pi_star, _, _, _ = go.fit(X_all, seed=SEED, deterministic=True, use_cpu_kmeans=True)\n",
    "        except Exception:\n",
    "            raise optuna.TrialPruned(f\"GO-LR failed (metric={go_metric})\")\n",
    "\n",
    "    # ---- 5x5 CV: NSC+TabPFN per fold using fixed Pi_star ----\n",
    "    head_cfg = TabPFN25Config(\n",
    "        task_type=\"multiclass\",\n",
    "        num_classes=int(NUM_CLASSES),\n",
    "        device=TABPFN_DEVICE,\n",
    "        random_state=int(tabpfn_seed),\n",
    "    )\n",
    "\n",
    "    accs = []\n",
    "    for fold_id, (tr_idx, va_idx) in enumerate(rkf.split(X_all, y_all), start=1):\n",
    "        X_tr = X_all[tr_idx]\n",
    "        y_tr = y_all[tr_idx]\n",
    "        X_va = X_all[va_idx]\n",
    "        y_va = y_all[va_idx]\n",
    "\n",
    "        # NSC config on TRAIN only\n",
    "        nsc = PIDFSegPCA(\n",
    "            segmentation=nsc_seg,\n",
    "            l_min=int(nsc_lmin),\n",
    "            m_rule=nsc_m_rule,\n",
    "            gamma=float(nsc_gamma),\n",
    "            beta=float(nsc_beta),\n",
    "            tau=float(nsc_tau),\n",
    "            M_min=int(nsc_Mmin),\n",
    "            M_max=int(nsc_Mmax),\n",
    "            assume_standardized=bool(assume_standardized),\n",
    "            device=NSC_DEVICE,\n",
    "        )\n",
    "\n",
    "        deltas = None if nsc_seg == \"uniform\" else compute_deltas_adjacent_corr(X_tr, Pi_star)\n",
    "\n",
    "        X_tr_t = torch.from_numpy(X_tr)\n",
    "        nsc.configure(Pi_star=Pi_star, X_train=X_tr_t, tau=float(nsc_tau), deltas=deltas)\n",
    "\n",
    "        Z_tr = nsc.compress(X_tr_t, mode=\"flatten\").cpu().numpy()\n",
    "        Z_va = nsc.compress(torch.from_numpy(X_va), mode=\"flatten\").cpu().numpy()\n",
    "\n",
    "        # TabPFN fit/eval\n",
    "        head = TabPFN25Head(head_cfg)\n",
    "        head.fit(Z_tr, y_tr)\n",
    "\n",
    "        P = head.predict_proba(Z_va)\n",
    "        pred = np.argmax(P, axis=1)\n",
    "        acc = float(accuracy_score(y_va, pred))\n",
    "        accs.append(acc)\n",
    "\n",
    "        # prune on running mean\n",
    "        trial.report(float(np.mean(accs)), step=fold_id)\n",
    "        if trial.should_prune():\n",
    "            cleanup_cuda()\n",
    "            raise optuna.TrialPruned()\n",
    "\n",
    "        cleanup_cuda()\n",
    "\n",
    "    mean_acc = float(np.mean(accs))\n",
    "    std_acc  = float(np.std(accs, ddof=1))\n",
    "    trial.set_user_attr(\"mean_acc\", mean_acc)\n",
    "    trial.set_user_attr(\"std_acc\", std_acc)\n",
    "    return mean_acc\n",
    "\n",
    "# -----------------------\n",
    "# Run Optuna\n",
    "# -----------------------\n",
    "sampler = optuna.samplers.TPESampler(seed=SEED, multivariate=True, group=True)\n",
    "pruner  = optuna.pruners.MedianPruner(n_warmup_steps=10)  # warmup because 25 folds\n",
    "\n",
    "study = optuna.create_study(direction=\"maximize\", sampler=sampler, pruner=pruner)\n",
    "study.optimize(objective, n_trials=N_TRIALS, show_progress_bar=True, gc_after_trial=True, n_jobs=1)\n",
    "\n",
    "best = study.best_trial\n",
    "print(\"\\n================ BEST TRIAL ================\")\n",
    "print(f\"mean_acc ± std_acc = {best.user_attrs.get('mean_acc', best.value):.6f} ± {best.user_attrs.get('std_acc', float('nan')):.6f}\")\n",
    "print(\"\\nBest hyperparameters:\")\n",
    "for k, v in best.params.items():\n",
    "    print(f\"  {k}: {v}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1c7dbbf3-9d55-4fd1-b696-5387a0fd1cad",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
