# Name of the model this configuration file is written for.
# NOTE(review): presumably used by the training code to pick the model implementation — confirm.
model_name: 'flexmoe'

# -----------------------
# Task Configuration
# -----------------------
# Name of the prediction task.
task: 'phenotype'
# NOTE(review): presumably the number of output labels for `task` — confirm.
num_classes: 25
# NOTE(review): presumably the feature dimension of the EHR input — confirm against the data loader.
input_dim: 49

# -----------------------
# Encoder Selection
# -----------------------
# One encoder name per modality; the accepted names are listed inline.
ehr_encoder: 'transformer'        # options: lstm, transformer
cxr_encoder: 'resnet50'    # options: resnet50, vit_b_16
# NOTE(review): presumably loads pretrained weights for the CXR encoder — confirm which encoder(s) this flag affects.
pretrained: true

# -----------------------
# EHR Encoder Parameters
# -----------------------
# Two groups of settings, one per supported `ehr_encoder` value.
# NOTE(review): presumably only the group matching `ehr_encoder` is read — confirm.
# Mind the similar key names: `ehr_num_layers` is the LSTM setting,
# `ehr_n_layers` is the Transformer setting.
# LSTM specific
ehr_num_layers: 1
ehr_bidirectional: true

# Transformer specific
ehr_n_head: 4
ehr_n_layers: 1

# -----------------------
# FlexMoE Architecture
# -----------------------
# NOTE(review): the meaning of each key below is inferred from its name only —
# confirm against the model code before relying on it.
hidden_dim: 256
num_patches: 16
num_layers: 1
num_layers_pred: 1
# Mixture-of-experts routing settings.
# NOTE(review): `top_k` presumably must not exceed `num_experts` — confirm,
# and keep the two in step when changing either.
num_experts: 16
num_routers: 1
top_k: 4
num_heads: 4
dropout: 0.2

# -----------------------
# Training Configuration
# -----------------------
lr: 0.0001
# NOTE(review): presumably the weight of the gating/routing auxiliary loss — confirm.
gate_loss_weight: 0.01
epochs: 50
# NOTE(review): presumably the early-stopping patience, in epochs — confirm.
patience: 10

use_label_weights: false  # Enable/disable label weights
# Options: 'balanced', 'inverse', 'sqrt_inverse', 'log_inverse', 'custom'
# NOTE(review): presumably only read when `use_label_weights` is true — confirm.
label_weight_method: 'balanced'

# -----------------------
# Fine-tuning Parameters (candidate values)
# -----------------------
# num_experts: 2, 4, 8, 16, 32
# num_routers: 1, 2
# gate_loss_weight: 0.001, 0.01, 0.1
# top_k: 2, 4, 8, 16



