# Baseline settings, published under the `DEFAULT` anchor so they can be
# aliased or merged elsewhere.
# NOTE(review): no `*DEFAULT` alias is visible in this view — confirm usage
# before renaming or removing the anchor.
default: &DEFAULT
  # Architecture selector. Presumably names the sibling section holding that
  # architecture's hyperparameters (`transformer` below) — verify against the
  # code that loads this file.
  arch: 'transformer'
  # Canonical lowercase boolean; parses the same under YAML 1.1 and 1.2.
  verbose: true

  # Hyperparameters for the `transformer` architecture.
  transformer:
    dropout: 0.1
    num_encoder_layers: 6
    num_decoder_layers: 6
    # d_model divides evenly by n_head (512 / 16 = 32). Multi-head attention
    # implementations typically require this — keep it true when editing
    # either value (TODO confirm the consumer enforces it).
    n_head: 16
    d_model: 512
    # NOTE(review): units are presumably tokens and the values look like
    # maximum lengths — confirm against the data pipeline.
    source_sequence_length: 200
    target_sequence_length: 200

  # Data-loading settings.
  data:
    batch_size: 64
