# @package _global_
# Dataset overrides.
dataset:
  # NOTE(review): the meaning of `coeff` is not visible in this file —
  # presumably a dataset-generation coefficient; confirm against the
  # dataset config/loader that consumes it.
  coeff: 2.0

# Model hyperparameter overrides: one group for the encoder and one for the
# decoder, each carrying its own optimizer learning rate and batch size.
model:
  # Encoder hyperparameters.
  encoder:
    seq_hidden_units: 12
    # NOTE(review): `br_size` is presumably the width of the learned
    # representation — confirm against the model code.
    br_size: 4
    fc_hidden_units: 2
    dropout_rate: 0.1
    num_layer: 2
    batch_size: 256
    optimizer:
      learning_rate: 0.01

    # Relative-position window for the encoder's self positional encoding.
    self_positional_encoding:
      max_relative_position: 15

  # NOTE(review): presumably toggles the decoder training stage — confirm
  # with the training script. Written as a canonical lowercase boolean.
  train_decoder: true
  # Decoder hyperparameters. Compared with the encoder above, the learning
  # rate is 10x smaller (0.001 vs 0.01) and the batch size is 2x larger
  # (512 vs 256).
  # NOTE(review): unlike the encoder, no `seq_hidden_units` is set here —
  # presumably it comes from defaults or is derived elsewhere; confirm.
  decoder:
    optimizer:
      learning_rate: 0.001
    batch_size: 512
    br_size: 3
    fc_hidden_units: 9
    dropout_rate: 0.1
    num_layer: 2

    # Relative-position window for the decoder's cross positional encoding.
    cross_positional_encoding:
      max_relative_position: 15

# Experiment-level settings.
exp:
  # NOTE(review): presumably disables exponential moving averaging of the
  # model weights — confirm with the training code. Written as a canonical
  # lowercase boolean.
  weights_ema: false
  # Name of the balancing method to use; the set of accepted names is
  # defined by the consumer of this config, not by this file.
  balancing: grad_reverse