# Experiment / training-loop settings.
exp:
  num_epochs: 1000
  batch_size: 128
  # Written with an explicit mantissa dot and signed exponent: YAML 1.1
  # loaders (e.g. PyYAML) resolve a bare `1e-5` as the string "1e-5",
  # not as a float.
  learning_rate: 1.0e-5
  loss_fn: mae
  target_metric: rmse

  # NOTE(review): patience equals num_epochs; if this is an early-stopping
  # patience it presumably can never trigger - confirm that is intended.
  patience: 1000
  optimizer:
    type: "Adam"
  scheduler:
    type: "ExponentialLR"
    gamma: 0.999
  memory_update_interval: 1

# Model selection, checkpoint location and architecture sizes.
model:
  model_type: "multi_anchor_smi"

  # Checkpoint lookup; presumably `path` is the directory and `ckpt_path`
  # the file name inside it - verify against the loader.
  smi_ted_version: "light"
  path: "./baselines/smi_ted/saved_results"
  ckpt_path: "smi_ted_Light_40.pt"

  n_output: 1
  # NOTE(review): integer flag here, while `freeze_encoder` below is a YAML
  # boolean - confirm how the consumer reads it before normalizing.
  train_decoder: 1

  latent_dim: 768
  num_heads: 4
  freeze_encoder: true

# Anchor retrieval / sampling settings.
transducer:
  num_candidates: 10             # Fixed number of anchors retrieved (k)

  # Strategy currently selected is "topk".
  # NOTE(review): the `adaptive_mask` and `diverse_topm` sections below are
  # presumably only read when the matching strategy is selected - confirm.
  sampling_strategy: "topk"
  anchor_metric: "euclidean"         # Use Euclidean distance
  use_anchor_weights: false          # Don't use weights as features

  # --- Adaptive parameters ---
  adaptive_mask:
    k_min: 2                  # Min effective k
    k_max: 5                  # Max effective k (<= num_candidates)
    # Threshold multiplier (tune based on distance scale).
    # NOTE(review): earlier note suggested a factor > 1 is usual with
    # Euclidean distance - confirm.
    density_threshold_factor: 1.5

  # Presumably parameters for a diversity-aware top-m strategy - verify
  # against the consumer.
  diverse_topm:
    diversity_factor: 2
