# Root-table settings (keys that appear before the first [table] header).
# NOTE(review): the many-digit float values look machine-generated, e.g. the
# output of a hyperparameter search — confirm before hand-editing them.
lr = 0.00017654048052495074
batch_size = 64
# Four integer entries; presumably one hidden-layer width each — verify
# against the model-building code.
d_layers = [206, 243, 243, 233]
weight_decay = 0.0048696409415209
# String value; the set of accepted optimizer names is defined by the
# consumer, not by this file.
optimizer_type = "AdamW"

# NOTE(review): [training].max_epochs is set to 500 while this key is 316;
# confirm which of the two the training code actually reads.
epochs = 316
# Presumably an early-stopping patience counted in epochs — TODO confirm.
patience = 17

# Dataset selection.
# NOTE(review): dataset_id is a bare integer; the catalog or registry it
# refers to is not stated anywhere in this file — TODO document the source.
[data]
dataset_id = 1471

# Model settings.
[model]
# Presumably the number of output classes (2 would mean a binary task) —
# verify against the model code.
num_classes = 2
# Boolean flag; fallback behavior when no GPU is available is decided by the
# consumer and is not visible here.
use_gpu = true
# Presumably an embedding dimension; what gets embedded is not shown here —
# TODO confirm.
d_embedding = 8

# Training-loop settings.
# NOTE(review): the root table also defines `epochs` (316) and `patience`
# (17); confirm how those interact with the keys below.
[training]
max_epochs = 500  # differs from root-level `epochs`; confirm precedence
min_delta = 1e-4  # presumably the minimum improvement that counts for early stopping — TODO confirm
verbose = true

# Presumably a gradient-norm clipping threshold — verify against the
# training code.
max_grad_norm = 5.0

# Output / persistence settings: three boolean switches and two target file
# names.
[output]
save_best_model = true
save_trial_history = true
backup_results = true
# Both paths are bare file names with no directory component; the directory
# they resolve against is determined by the consumer (presumably its working
# directory — TODO confirm).
model_save_path = "best_mlp_model.pt"
config_save_path = "best_mlp_config.toml"