# Model settings.
# NOTE(review): the `_target_` key suggests this mapping is consumed by a
# Hydra-style instantiate call, with the remaining keys passed as constructor
# arguments -- confirm against the loading code.
architecture:
  # Dotted import path of the class to build.
  _target_: krt.models.gnp.gnp.GNP
  # Presumably the width of the learned embeddings -- TODO confirm.
  embedding_dim: 64
  # Presumably the number of attention heads -- TODO confirm against GNP.
  nhead: 4
  # Presumably the number of stacked graph layers -- TODO confirm.
  graph_depth: 4
  # Presumably the number of decoder layers -- TODO confirm.
  decoder_depth: 2
  # Kept quoted so it is always read as a string; the accepted values are
  # defined by GNP and are not visible from this file.
  edge_type: 'L2'
# Optimisation / training-loop settings.
training:
  # Number of training epochs requested (presumably an upper bound, since
  # early stopping is configured below -- confirm against the training loop).
  epochs: 10000
  # Presumably the number of epochs without improvement tolerated before
  # training stops early -- TODO confirm the monitored metric.
  early_stop_patience: 500
  # Written with an explicit decimal point: YAML 1.1 resolvers (e.g. plain
  # PyYAML) only recognise exponent notation as a float when a '.' is present,
  # and would otherwise load `3e-4` as the string '3e-4'.
  learning_rate: 3.0e-4
  # 0.0 disables weight decay (assuming the usual optimiser semantics).
  weight_decay: 0.0
  # Canonical lowercase boolean; resolves identically under YAML 1.1 and 1.2.
  # NOTE(review): presumably toggles a learning-rate scheduler -- confirm.
  lr_schedule: false
