# Model definition: which class to build and the arguments it receives.
architecture:
  # Dotted import path of the model class. The `_target_` key follows the
  # Hydra instantiate convention -- NOTE(review): confirm that loader is used.
  _target_: krt.models.gtnp.GTNP
  # NOTE(review): d_model / nhead / num_blocks look like the usual attention
  # hyperparameters (embedding width, head count, layer count) -- confirm
  # against the GTNP constructor signature.
  d_model: 64
  nhead: 4
  num_blocks: 6
  # String selectors; the set of accepted values is defined by GTNP, not here.
  x_embed_types: 'mlp'
  edge_types: 'L2'
# Optimisation settings read by the training code.
training:
  epochs: 10000
  # NOTE(review): presumably the number of epochs without improvement that is
  # tolerated before stopping early -- confirm against the training loop.
  early_stop_patience: 500
  # Keep the dot in the mantissa: YAML 1.1 loaders (e.g. PyYAML) resolve a
  # bare `5e-4` as the string "5e-4" rather than a float.
  learning_rate: 5.0e-4
  weight_decay: 0.0
  # Canonical lowercase boolean, unambiguous across YAML 1.1 and 1.2 loaders.
  lr_schedule: true
