# Root-level hyperparameters. The high-precision float values suggest they
# came from an automated search rather than being hand-picked — TODO confirm.
lr = 0.0017583640270008513
batch_size = 32
# Three integers; presumably the hidden-layer widths — verify against the consumer.
d_layers = [37, 56, 39]
weight_decay = 0.00035127047262708476
optimizer_type = "AdamW"

# NOTE(review): this file also defines [training].max_epochs = 500. Which of
# the two epoch limits the consumer honors is not visible here — confirm.
epochs = 323
# Presumably the early-stopping patience, counted in epochs — TODO confirm.
patience = 20

# Dataset selection.
[data]
# Numeric dataset identifier. The registry it belongs to is not stated in this
# file (presumably an OpenML dataset ID — TODO confirm).
dataset_id = 40691

# Model settings.
[model]
num_classes = 6
use_gpu = true
# Empty array. Presumably lists per-feature category cardinalities, in which
# case empty means "no categorical features" — TODO confirm against the consumer.
categories = []
d_embedding = 8

# Training-loop settings.
[training]
# NOTE(review): a root-level `epochs = 323` key also exists in this file;
# confirm which of the two limits the consumer actually reads.
max_epochs = 500
# Presumably the minimum metric improvement that counts as progress for early
# stopping (pairs with the root-level `patience`) — TODO confirm.
min_delta = 1e-4
verbose = true
# Presumably the gradient-norm clipping threshold — TODO confirm.
max_grad_norm = 5.0

# Output and persistence settings.
[output]
save_best_model = true
save_trial_history = true
backup_results = true
# Both paths are relative file names; presumably resolved against the
# consumer's working directory — TODO confirm.
model_save_path = "best_mlp_model.pt"
config_save_path = "best_mlp_config.toml"