# Baseline configuration. The &DEFAULT anchor lets other mappings in the same
# YAML document reuse these values through the *DEFAULT alias.
default: &DEFAULT
  # Architecture name; its value matches the `gpt2` section key below
  # (presumably used to select that section -- confirm against the loader).
  arch: 'gpt2'
  # Boolean flag, written in canonical lowercase form.
  verbose: true

  # Settings grouped under the `gpt2` key.
  gpt2:
    # NOTE(review): looks like a model/checkpoint identifier -- confirm the
    # exact spelling and case the consumer expects.
    model: 'GPT2-large'
    dropout: 0.1
    # NOTE(review): unit is presumably tokens -- confirm.
    sequence_length: 256

  # Settings grouped under the `data` key.
  data:
    batch_size: 16
    