seed: null

data:
  dataset: mnist  #tinyimagenet, celeba, celebahq, etc.
  channels: 1
  image_size: 32
  random_flip: true
  n_samples: 60000 # max number of samples to use for training
  #num_classes: 10


method: dlpm # dlpm

dlpm:
  alpha: 2.0
  reverse_steps: 4000
  rescale_timesteps: true
  input_scaling: false


diffusion:
  T: 1.0
  process_type: VP # VE or VP
  schedule: cosine
  rescale_timesteps: true # rescale the timesteps to [0, 1]
  
  learn_variance: false # learn the variance
  conditional: false # conditional diffusion

eval:
  data_to_generate: 2000
  real_data: 2000
  batch_size: 256

  diffusion:
    epsilon: 0.00001
    deterministic: false # set to true for ode sampling
    reverse_steps: 500
    clip_denoised: true # clip denoised data to [0, 1]
    ei_integrator: true

  dlpm:
    deterministic: false # set to true for ddim sampling
    reverse_steps: 500
    clip_denoised: true # clip denoised data to [0, 1]
    ei_integrator: true


model:
  architecture: 'unet'
  unet:
    model_type: ddpm
    attn_resolutions: [2, 4]
    channel_mult: [1, 2, 2, 2]
    dropout: 0.0 #0.1
    model_channels: 32
    num_heads: 4
    num_res_blocks: 2


training:
  batch_size: 256
  num_workers: 2

  diffusion:
    ema_rates:
    - 0.999
    grad_clip: 1.0
  
  dlpm:
    ema_rates:
    - 0.999
    grad_clip: 1.0

optim:
  optimizer: adamw
  momentum: 0.
  temperature: 1.0 # 0.00001
  schedule: null #steplr
  lr: 0.0001
  warmup: 200 
  lr_steps: 1000000
  lr_step_size: 5000
  lr_gamma: 0.95

run:
  steps: 10000
  eval_freq: null
  checkpoint_freq: null
  progress: false # print progress bar
  id: null # experiment id
  fp16: false # use fp16

