global:
  device: 'auto'  # 'auto', 'cpu', 'cuda', 'cuda:0'

save_wsi_features: false 


classifiers:
  homil:
    hidden_dim: 64
    dropout_rate: 0.4
    enable_visualization: true
    viz_save_dir: 'homil_visualizations'
    viz_update_freq: 10
    conv_num_kernels: 4
    cov_extraction_method: 'conv_pooling'  # 'weighted_rows', 'upper_triangle', 'sqrt_upper_triangle', 'conv_pooling'
    conv_kernel_size: 64
    fusion_method: 'attention'
    learning_rate: 0.0001
    weight_decay: 1e-5
    epochs: 100
    batch_size: 4

    newton_schulz_iters: 5
    newton_schulz_eps: 1e-8

  attention:
    hidden_dim: 64
    dropout_rate: 0.4
    learning_rate: 0.0005
    weight_decay: 1e-5
    epochs: 100
    batch_size: 16

  mean_pooling:
    hidden_layers: [256, 128]
    dropout_rate: 0.3
    activation: 'relu'
    learning_rate: 0.0005
    weight_decay: 1e-5
    epochs: 100
    batch_size: 32

  max_pooling:
    hidden_layers: [256, 128]
    dropout_rate: 0.3
    activation: 'relu'
    learning_rate: 0.0005
    weight_decay: 1e-5
    epochs: 100
    batch_size: 32 

  transmil:
    input_dim: 512          
    hidden_dim: 64          
    optimizer_type: 'adamw'  
    scheduler_type: 'cosine'   
    warmup_epochs: 5          
    learning_rate: 0.0005    
    weight_decay: 1e-5      
    epochs: 100            
    batch_size: 16         

  clam_sb:
    gate: true     
    size_arg: "small"    
    dropout: 0.25      
    k_sample: 8           
    subtyping: false      
    learning_rate: 0.0005      
    weight_decay: 1e-5  
    batch_size: 16     
    bag_weight: 0.7      
    instance_weight: 0.3    
    epochs: 100            
    early_stopping: false   
    patience: 20             

  clam_mb:
    gate: true               
    size_arg: "small"     
    dropout: 0.25          
    k_sample: 8             
    subtyping: false   
    learning_rate: 0.0005    
    weight_decay: 1e-5    
    batch_size: 16        
    bag_weight: 0.5      
    instance_weight: 0.5  
    epochs: 100            
    early_stopping: false  
    patience: 20          


  s4mil:
    hidden_dim: 64  
    d_state: 4  
    dropout_rate: 0.4    
    learning_rate: 0.0005   
    weight_decay: 1e-5  
    epochs: 100           
    batch_size: 16       
    early_stopping: false    
    patience: 20           