# Optimizer settings.
# NOTE(review): the high-precision floats look like output of an automated
# hyperparameter search — confirm before hand-editing.
optimizer_type = "adamw"
lr = 0.004880610344470438
weight_decay = 0.06711612414860951

# Mini-batch size.
batch_size = 256

# Network shape.
# NOTE(review): n_sub_* are presumably per-layer sub-unit counts for the
# first, middle and last layers — confirm against the model code.
n_layers = 3
n_sub_first = 40
n_sub_middle = 8
n_sub_last = 6

# Dataset selection.
# NOTE(review): dataset_id is a numeric identifier resolved by the data
# loader; which catalogue it refers to is not visible here — confirm.
[data]
dataset_id = 42192

# Model selection.
# NOTE(review): the set of valid algorithm names is defined by the consuming
# code, not by this file — confirm "BL_shallow" against it.
[model]
algorithm = "BL_shallow"

# Training-loop controls.
[training]
verbose = false
# NOTE(review): patience is presumably the early-stopping window, counted in
# epochs — confirm units with the trainer.
patience = 20
use_gpu = true
# Upper bound on the number of training epochs.
max_epochs = 500