import: [lookup_embedder]

trme:
  transformer_impl: pytorch
  use_preln: false
  use_rat: false
  dim: -1
  nlayer: 2
  nhead: 2

  # default values match the same number in pytorch implementation
  ff_dim: 2048 # transformer FFN dimension
  hidden_dropout: 0.1 # transformer hidden dropout
  attn_dropout: 0.1 # transformer attention dropout
  ctx_dropout: 0.5 # neighbor discrete dropout
  output_dropout: 0.0 # entity embedding dropout in output
  rel_dropout: 0.0
  self_dropout: 0.0
  mlm_mask: 0.6
  mlm_replace: 0.3
  add_mlm_loss: true
  activation: relu
  max_context_size: 0
  similarity: DotProduct
  initializer_range: 0.02 # transformer Linear and Embedding weight normal distribution std
  entity_embedder:
    type: lookup_embedder
    +++: +++
  relation_embedder:
    type: lookup_embedder
    +++: +++


  class_name: TrmE
  semantic_encoding: false
  semantic_encoding_decay_weight: 0.9 # exponentially decay rate
  semantic_encoding_loss: false
  max_hop: 1 # allowed max-hop for shortest distance path
  semantic_partition: false
  # alter: alternative optimize the output in different batches
  # avg: average the outputs of two partitions
  # cat: concat two outputs
  dual_partiton_mode: avg
  update_semantic_partition_freq: 10 # update the semantic_partition every n epoches 