# @package _global_

dataset:
    # No value is set in this file; written as an explicit null instead of a
    # bare key so the empty value is clearly intentional.
    # NOTE(review): presumably supplied by another config or a command-line
    # override - confirm.
    coeff: null

# Model hyperparameters, split into encoder and decoder sub-configs; each one
# carries its own layer sizes, dropout, batch size and optimizer settings.
model:
    name: EDCT

    # Encoder sub-config (the only one with a positional-encoding section).
    encoder:
        seq_hidden_units: 18
        br_size: 18
        fc_hidden_units: 18
        dropout_rate: 0.1
        train_batch_size: 128
        num_layer: 2
        self_positional_encoding:
            max_relative_position: 15
        optimizer:
            learning_rate: 0.01

    # Decoder sub-config: smaller layers, heavier dropout, larger batches and
    # a lower learning rate than the encoder.
    decoder:
        br_size: 4
        fc_hidden_units: 8
        dropout_rate: 0.5
        num_layer: 2
        train_batch_size: 1024
        optimizer:
            learning_rate: 0.001

# Experiment-level settings: runtime environment, balancing options and
# exponential moving average (EMA) of weights.
exp:
    # environment
    seed: null                    # No seed is set in this file (explicit null)
    gpu: 0
    max_epochs: 100

    # for balancing
    balancing: domain_confusion   # grad_reverse / domain_confusion
    alpha: 0.01                   # Does not take full effect if update_alpha is true
    update_alpha: true            # Exponential growth of alpha from 0.0 to 1.0
    alpha_rate: exp

    # for ema
    weights_ema: true             # Exponential moving average of weights
    beta: 0.99                    # EMA beta

    # balancing
    bce_weight: false             # Weight in BCE loss, proportional to treatment frequency
