# UNet architecture (ddpm++ arch)
img_resolution: 32
img_channels: 1
label_dim: 10  # number of classes

# Network variant selectors.
# NOTE(review): valid values are defined by the model code, not visible here —
# confirm against the constructor selected by `model_type`.
model_type: 'MultiHeadSongUNet'
embedding_type: 'positional'
encoder_type: 'standard'
decoder_type: 'standard'
channel_mult_noise: 1
resample_filter: [1, 1]

# Width and regularization.
# NOTE(review): `channel_mult` presumably holds one multiplier of
# `model_channels` per resolution level — confirm against the model code.
model_channels: 128
channel_mult: [2, 2, 2]
dropout: 0.13
label_dropout: 0

# Precond
sigma_max: 80.0
sigma_min: 0.002
# Declared exactly once: this file is a single flat mapping, so repeating
# `sigma_data` under "Loss" would be a duplicate key (rejected by strict YAML
# loaders, silently last-wins in lenient ones).
# NOTE(review): presumably consumed by both the preconditioner and the loss —
# confirm against the code that reads this config.
sigma_data: 0.5

# Loss
# `sigma_data` is intentionally not repeated here; see the "Precond" section.
P_mean: -1.2
P_std: 1.2

# EMA
# NOTE(review): the `_kimg` suffix suggests this half-life is expressed in
# thousands of images — confirm against the training loop.
ema_halflife_kimg: 500
# NOTE(review): presumably a ramp-up coefficient applied to the EMA schedule
# early in training — confirm how the trainer combines it with the half-life.
ema_rampup_ratio: 0.05