# @package _global_
# Dataset overrides applied by this config.
dataset:
  # NOTE(review): presumably a cap on how many items the dataset uses; the
  # unit (samples, subjects, ...) is not visible from this file - confirm
  # against the dataset code that reads `dataset.max_number`.
  max_number: 1000

# Hyperparameters for the `multi` model entry.
model:
  multi:
    optimizer:
      learning_rate: 0.005
    batch_size: 64
    # NOTE(review): seq_hidden_units and br_size are both 18 here; whether
    # they are required to match is not visible from this file - confirm
    # before changing one without the other.
    seq_hidden_units: 18
    br_size: 18
    fc_hidden_units: 14
    dropout_rate: 0.1
    num_layer: 1
    # NOTE(review): if the model uses multi-head attention, the hidden size
    # usually has to be divisible by num_heads (18 / 3 = 6 holds here) -
    # verify against the model code when tuning either value.
    num_heads: 3

    # Settings for the `self_positional_encoding` sub-section.
    self_positional_encoding:
      # NOTE(review): presumably the clipping distance for relative
      # positions - confirm against the consumer of this key.
      max_relative_position: 15

# Experiment-level settings.
exp:
  # Boolean flag, written in the canonical lowercase YAML form.
  # NOTE(review): presumably enables an exponential moving average of the
  # model weights - confirm against the training code.
  weights_ema: true
  # NOTE(review): the roles of alpha and beta are not visible from this file
  # (beta may be the EMA decay, alpha a loss weight) - confirm before tuning.
  alpha: 0.01
  beta: 0.99
  # Name of the balancing strategy; valid values are defined by the consumer.
  balancing: domain_confusion
  max_epochs: 2000
