# Base configuration this file builds on; the keys below are this file's own
# settings. NOTE(review): presumably merged over the parent by the project's
# config loader - confirm the merge semantics there.
parent: research/conditional/train/configs/baselines/gpt/dense/common.yaml
# Quoted so the digest is always loaded as a string: an unquoted hex digest
# that happens to be all digits (or shaped like 12e34) would be typed as a
# number by the YAML parser.
# NOTE(review): presumably the MD5 of the parent file, to be refreshed
# whenever the parent changes - confirm against the loader.
md5_parent_hash: '19b288a05a2e35404e144b2f938d7bd8'

# Size settings for this configuration.
# NOTE(review): the key names suggest transformer dimensions (model width,
# feed-forward width, number of blocks, attention heads) - confirm against
# the code that consumes these params.
params:
  dmodel: 256
  dff: 1024  # 4 x dmodel
  n_blocks: 8
  n_att_heads: 4
