# Model configuration: names the model type and lists its hyperparameters.
# NOTE(review): the code that consumes this file is not visible here; the
# per-key notes below are inferred from key names — confirm against the loader.
model_type: gpt

# Hyperparameters for the model selected above.
# presumably only read when model_type is "gpt" — TODO confirm
gpt_params:
  # presumably the number of stacked transformer blocks — TODO confirm
  n_layer: 24
  # presumably the number of attention heads per block — TODO confirm
  n_head: 16
  # presumably the embedding width; if split evenly across heads this gives
  # 1024 / 16 = 64 per head — TODO confirm
  n_embd: 1024
  # presumably a dropout probability (a fraction, not a percent) — TODO confirm
  dropout: 0.2
  # YAML boolean; presumably turns off bias terms in the model's layers —
  # TODO confirm which layers the consumer applies it to
  bias: false

