seed: null

data:
  dataset: gmm_grid     # gaussian mixture grid
  d: 4                  # data dimension
  n: 3                  # n*n mixture components
  
  n_samples: 5000      # number of samples in the dataset
  random_means: true    # randomize the means of the mixture components
  
  std: 0.1
  theta: 2.0
  weights:
  # - 0.01
  # - 0.99
  - 0.01
  - 0.1
  - 0.3
  - 0.2
  - 0.02
  - 0.15
  - 0.02
  - 0.15
  - 0.05

method: diffusion

diffusion:
  T: 1.0
  process_type: VP # VE or VP
  schedule: cosine
  rescale_timesteps: true # rescale the timesteps to [0, 1]
  
  learn_variance: false # learn the variance
  conditional: false # conditional diffusion

eval:
  data_to_generate: 25000
  real_data: 25000
  batch_size: 4096

  diffusion:
    epsilon: 0.000001
    deterministic: false # set to true for ode sampling
    reverse_steps: 1000
    clip_denoised: false # clip denoised data to [0, 1] or [-1, 1]
    ei_integrator: true


model:
  architecture: 'mlp'
  mlp:
    act: silu
    dropout_rate: 0.0
    layer_norm: true
    nblocks: 3
    nunits: 32
    skip_connection: true
    time_emb_size: 32


training:
  batch_size: 512
  num_workers: 0

  diffusion:
    refresh_data: false # resample the dataset at each epoch. Dataset object must implement refresh method 

    normalize: true # normalize the data from [0, 1] to [-1, 1]
    
    ema_rates:
    #- 0.9
    grad_clip: null #1.0

optim:
  optimizer: adamw
  momentum: 0.
  temperature: 0.00001
  schedule: null # linear, steplr
  lr: 0.001
  warmup: 0 #1000
  lr_steps: 2000
  lr_step_size: 400
  lr_gamma: 0.99

run:
  epochs: 20
  eval_freq: null
  checkpoint_freq: null
  stop_lower_loss_threshold: null
  progress: false # print progress bar
  id: null # experiment id
  fp16: false # use fp16

