# Config overlay for a GPT dense baseline (per the parent path below).
# NOTE(review): `parent` presumably names the config these values are
# layered on top of — confirm against the config loader.
parent: research/conditional/train/configs/baselines/gpt/dense/common.yaml
# NOTE(review): presumably the MD5 digest of the parent file, used to detect
# parent edits — confirm. Quoted so that a digest which happens to look
# numeric (all digits, or digits around a single `e`) is always a string.
md5_parent_hash: '19b288a05a2e35404e144b2f938d7bd8'

# Values set by this file.
# NOTE(review): key meanings below are inferred from their names — confirm.
params:
  dmodel: 1024  # presumably the model (hidden) width
  dff: 2048  # presumably the feed-forward inner width (2 x dmodel here)
  n_blocks: 24  # presumably the number of stacked blocks
  n_att_heads: 16  # presumably attention heads per block
