data:
    dataset: "visda"
    seed: 
    num_classes: 12
    num_workers: 4
    dataroot: './data_list/VisDA'
    source_domain: 'train'
    target_domain: 'validation'

model:
    data_dim: 256
    hidden_dim: 512
    feature_dim: 256
    var_type: fixedlarge
    ema_rate: 0.9999
    ema: True

diffusion:
    beta_schedule: linear  # cosine_anneal, cosine
    beta_start: 0.0001 #
    beta_end: 0.02 #
    timesteps: 1000 #
    aux_cls:
        h_dim: 512 #
        z_dim: 256 #
        pre_train: True #
        joint_train: False #
        n_pretrain_epochs: 1 #
        source_pretrain_epochs: 0 #
        logging_interval: 1 #
    
training:
    batch_size: 32
    weight_kl: 1.0 ##
    weight_kd: 1.0 ##
    weight_transfer: 1.0 ##
    n_epochs: 1 ###
    open_backbone: False
    warmup_epochs_adaptation: 1
    warmup_epochs_diffusion: 1
    snapshot_freq: 1000000000
    validation_freq: 50
    active: 'ttest'

testing:
    batch_size: 32
    sampling_size: 1000
    n_samples: 100
    n_bins: 10
    PICP_range: [2.5, 97.5]

optim:
    weight_decay: 0.000
    optimizer: "Adam"
    lr: 0.001
    beta1: 0.9
    amsgrad: False
    eps: 0.00000001
    grad_clip: 1.0
    lr_schedule: True
    min_lr: 0.0

aux_optim:
    weight_decay: 0.001
    optimizer: "SGD"
    lr: 0.01
    beta1: 0.9
    amsgrad: True
    eps: 0.00000001
    grad_clip: 1.0