# @package _global_
# Dataset-level override: sets the single `coeff` value for this run.
# NOTE(review): what `coeff` controls is defined by the dataset code that
# consumes this config, which is not visible here — confirm before changing.
dataset:
  coeff: 4.0

# Model hyperparameters, given separately for the `encoder` and `decoder`
# sub-models. Each sub-model carries its own layer sizes, dropout rate,
# layer count, batch size, and optimizer learning rate.
# NOTE(review): the exact meaning of each key is defined by the consuming
# model code, which is not visible here — confirm before tuning.
model:
  encoder:
    seq_hidden_units: 18
    br_size: 18
    fc_hidden_units: 18
    dropout_rate: 0.1
    num_layer: 2
    batch_size: 64
    optimizer:
      learning_rate: 0.001

    self_positional_encoding:
      max_relative_position: 15

  # Canonical lowercase boolean (was `True`); parses to the same value.
  # NOTE(review): presumably toggles training of the decoder — confirm.
  train_decoder: true
  decoder:
    # The decoder learning rate is 10x smaller than the encoder's (0.001) and
    # its batch size is 4x larger than the encoder's (64).
    optimizer:
      learning_rate: 0.0001
    batch_size: 256
    # No `seq_hidden_units` is set for the decoder in this file.
    # NOTE(review): presumably supplied by a default config or derived in
    # code — verify.
    br_size: 12
    fc_hidden_units: 48
    dropout_rate: 0.1
    num_layer: 2

    cross_positional_encoding:
      max_relative_position: 15

# Experiment-level switches.
# NOTE(review): the accepted values and their effects are defined by the
# consuming training code, which is not visible here — confirm before changing.
exp:
  # Canonical lowercase boolean (was `False`); parses to the same value.
  weights_ema: false
  # Plain string; presumably names the balancing strategy to use — verify the
  # set of valid names against the consumer.
  balancing: grad_reverse