---
# Transformer size settings layered on top of `wordlmtransformer_base`.
# NOTE(review): the base config is not visible from this file; which of the
# keys below it already defines (and with what values) should be confirmed.

# Hydra-style defaults list; entries are composed in the order listed.
defaults:
  - wordlmtransformer_base
  # `_self_` comes after the base entry, so (under Hydra's composition
  # rules) the values in this file take precedence over the base's.
  - _self_

# Key meanings below are inferred from their names -- TODO confirm against
# the model code that consumes this config.
# Note: num_attn_heads * attn_hidden_dim = 8 * 64 = 512 = input_dim, so
# attn_hidden_dim is presumably the per-head width.
num_attn_heads: 8
num_layers: 8
input_dim: 512
attn_hidden_dim: 64
# 2048 = 4 * input_dim.
fc_hidden_dim: 2048
