# Root-table keys. These must stay above the first [table] header: any key
# written below a header becomes a member of that table instead.
# NOTE(review): the high-precision lr / weight_decay values look
# machine-generated (e.g. by a tuning run) — confirm before hand-editing.
lr = 0.0002995991532241214
weight_decay = 0.0010033289979636665
batch_size = 128

# Layer count and n_sub_* sizes. Presumably architecture dimensions for the
# first / middle / last parts of the model; the exact meaning is defined by
# the consuming code — TODO confirm.
n_layers = 2
n_sub_first = 40
n_sub_middle = 8
n_sub_last = 6

# Optimizer selector, written as a basic string to match the quoting used
# for other string values in this file.
optimizer_type = "adamw"

# Dataset selection.
[data]
# Integer identifier of the dataset to load. Which registry or catalogue
# this id refers to is not stated in this file — verify against the loader.
dataset_id = 1120

# Model selection.
[model]
# Name of the algorithm/model variant. The set of accepted names is defined
# by the consuming code, not by this file.
algorithm = "BL_shallow"

# Training-loop settings.
[training]
verbose = false
# NOTE(review): presumably early-stopping patience, counted in epochs —
# confirm against the training code.
patience = 20

# The keys below are still part of [training]: a blank line does not end a
# TOML table, only the next [header] does. If they were meant to be
# root-level settings they would have to move above the first header.
use_gpu = true
eval_batch_size = 2048
max_epochs = 500