# Settings for models.toy_transformer.ToyTransformer. The `_target_` key
# follows the Hydra instantiate convention; presumably the remaining keys
# are passed to that class as keyword arguments -- TODO confirm.
_target_: models.toy_transformer.ToyTransformer
# Disabled here, so per the head_dim note below, head_dim is not used.
add_qk_attention: false
# NOTE(review): add_positional_encoding is off while cat_positional_encoding
# is on; how the two flags interact is not visible in this file -- confirm
# against ToyTransformer.
add_positional_encoding: false
cat_positional_encoding: true
# NOTE(review): the comment below refers to `add_embedding`, which is not
# set in the visible config -- verify the flag name and its default.
embedding_dim: 64 # Default, only used if add_embedding=true
head_dim: 64 # Default, only used if add_qk_attention=true
n_layers: 1
n_heads: 1