# @package _global_

# Dataset options.
dataset:
    # Left unset in this file (loads as null); presumably supplied by another
    # config or a command-line override -- TODO confirm.
    coeff: null

# Model selection and encoder hyperparameters.
model:
    name: CT
    encoder:
        # Alternatives noted inline by the original author for the next two
        # values: 32, 16.
        seq_hidden_units: 16
        br_size: 16
        fc_hidden_units: 32
        dropout_rate: 0.1
        train_batch_size: 256
        self_positional_encoding:
            max_relative_position: 15
        optimizer:
            learning_rate: 0.01

# Experiment / run settings.
exp:
    # Environment
    # seed is left unset in this file (loads as null); presumably supplied by
    # another config or a command-line override -- TODO confirm.
    seed: null
    gpu: 0
    max_epochs: 150

    # Balancing method
    balancing: domain_confusion  # one of: grad_reverse / domain_confusion
    # Not fully in effect when update_alpha is true.
    alpha: 0.01
    # Exponential growth of alpha from 0.0 to 1.0.
    update_alpha: true
    alpha_rate: exp

    # Exponential moving average (EMA) of weights
    weights_ema: true
    beta: 0.99  # EMA beta

    # Balancing: BCE loss weighting
    # Weight in BCE loss, proportional to treatment frequency.
    bce_weight: false
