# Inheritance header.
# NOTE(review): presumably the config loader layers this file on top of
# `parent`; confirm against the loader.
parent: research/conditional/train/configs/baselines/gpt/dense/common.yaml
# 32 hex characters; presumably the MD5 digest of the parent file, letting
# tooling detect that the parent changed -- TODO confirm.
# Quoted so a digest that happens to look numeric still loads as a string.
md5_parent_hash: '19b288a05a2e35404e144b2f938d7bd8'

# Model-size settings for this config.
# NOTE(review): the meanings below are inferred from the key names; confirm
# against the code that consumes `params`.
params:
  dmodel: 768  # presumably the model (hidden) width
  dff: 3072  # 4 * dmodel; presumably the feed-forward inner width
  n_blocks: 12  # presumably the number of stacked blocks
  n_att_heads: 12  # presumably attention heads per block; 768 / 12 = 64
