# Root-table hyperparameters (keys defined before the first table header).
# NOTE(review): the full-precision float values look machine-generated
# (e.g. by a hyperparameter search) — confirm before rounding or hand-editing.

# Optimizer settings.
optimizer_type = "adamw"
lr = 0.00018232197794903611
weight_decay = 0.004247058562261873
batch_size = 512

# NOTE(review): presumably model-size settings; the exact meaning of the
# n_sub_* keys is defined by the consuming code and is not visible here.
n_layers = 1
n_sub_first = 4
n_sub_middle = 1

# Dataset selection.
# NOTE(review): dataset_id is a numeric identifier; which registry or catalog
# it refers to is not visible in this file — confirm against the loader.
[data]
dataset_id = 1490

# Model selection.
# NOTE(review): "BL" is a short code interpreted by the consuming code; its
# meaning is not visible in this file.
[model]
algorithm = "BL"

# Training-run settings. Every key below belongs to the [training] table.
[training]
# NOTE(review): presumably the epoch budget and an early-stopping patience —
# confirm the units (epochs vs. evaluations) against the training loop.
max_epochs = 600
patience = 20
# Set independently of the root-level `batch_size` (both are 512 here).
eval_batch_size = 512
use_gpu = true
verbose = false