# Path to the parent config. Presumably the settings in this file are layered
# on top of it — TODO confirm merge semantics with the config loader.
parent: research/conditional/train/configs/baselines/gpt/dense/common.yaml
# NOTE(review): looks like an MD5 digest tied to the parent file, presumably
# checked so that edits to the parent are noticed — confirm with the loader.
md5_parent_hash: 19b288a05a2e35404e144b2f938d7bd8

# Size settings for this config. The meanings noted below are inferred from
# the key names and the parent path (gpt/dense) — TODO confirm against the
# training code that consumes them.
params:
  dmodel: 512  # presumably the model (embedding) width
  dff: 2048  # presumably the feed-forward hidden width; equals 4 * dmodel
  n_blocks: 4  # presumably the number of transformer blocks
  n_att_heads: 8  # presumably the number of attention heads per block
