# hybrid_eval_config.yaml

data:
  
  valid_path: "./tsp_data/tsp_solutions_valid10000_n50_s7991_solver_concorde.npz" 
  test_path: "./tsp_data/tsp_solutions_test1280_n50_s4321_solver_concorde.npz"  
  #test_path: "./tsp_data_n100/tsp_maps_n100_valid15000_v2_seed42.npz"  # [新增] 对应的最优解路径




model: 
  num_nodes: 50
  node_coord_dim: 2
  pos_embed_num_feats: 64
  node_embed_dim: 128
  prefix_enc_hidden_dim: 256
  prefix_cond_dim: 256
  gnn_n_layers: 12
  gnn_hidden_dim: 256
  gnn_aggregation: "sum"
  gnn_norm: "layer"
  gnn_learn_norm: true
  gnn_gated: true
  time_embed_dim: 256


rl_model:
  name: POMO  
  problem: 'tsp'
  ckpt_path: "./rl4co_main/RL_ckpt/pomo50_400e.ckpt" #    logs/train/runs/tsp100/am-tsp100/2025-05-22_09-06-34/checkpoints/epoch_099.ckpt

# Diffusion
dm_model:
  #ckpt_path: "./ckpt_tsp_difusco_style_new/tsp_conditional_diffusion_epoch_70.pth" 
  ckpt_path: "./ckpt_tsp_difusco_style_tsp50/Final_0_20_best_model_checkpoint.pth"
diffusion:
  num_timesteps: 1000
  schedule_type: 'cosine'


eval:
  batch_size: 1 
  num_inference_steps: 20
  inference_schedule_type: 'cosine'
  apply_two_opt: False
  num_samples_to_visualize: 5
  two_opt_max_iterations: 50

solver:

  use_theory_trigger: true 
  

  probe_rl_top_m:  15 #10 best but time 174; 6 time 77

  dm_probe_timestep: 500

  dm_prior_temp: 0.1 #0.1

  adaptive_m_p_thresh: 0.8

  entropy_threshold: 1.2
  kl_div_threshold: 4  
  

  dm_inference_steps: 10
  dynamic_n_cumulative_threshold: 0.6
  apply_two_opt: False