# Model selected by this config.
type: 'Transformer'

# Model type recorded as the baseline.
base_model_type: 'Transformer'

# Model configuration
# input_size is an interpolation: it takes its value from `dataset.x_dim`,
# which is defined outside this file.
input_size: ${dataset.x_dim}
# NOTE(review): the names below suggest the usual Transformer hyperparameters
# (model width, feed-forward width, attention head count) -- confirm against
# the model code that consumes them.
d_model: 32
d_ff: 128
n_heads: 8

# NOTE(review): presumably the number of encoder layers -- confirm.
e_layers: 3


# Optimization configuration
batch_size: 128
num_epochs: 500

# Scientific-notation floats are written with an explicit decimal point.
# YAML 1.1 loaders such as plain PyYAML resolve `1e-3` as the string "1e-3",
# while `1.0e-3` is resolved as a float by every loader.
lr: 1.0e-3
weight_decay: 1.0e-6
# NOTE(review): integer 0 presumably disables dropout -- confirm the consumer
# accepts an int here.
dropout: 0

