# Time-reversed Diffusion Sampler (DIS)
# Identifier of this sampler configuration.
name: dis

# Resolved via ${...} interpolation from keys under `target`.
step_size: ${target.dis.step_size}
batch_size: ${target.all.batch_size}
init_std: ${target.dis.initial_scale}

# Values fixed in this file.
# NOTE(review): `iters` / `num_steps` are presumably the number of training
# iterations and of discretization steps — confirm against the consumer.
iters: 40000
num_steps: 128
grad_clip: 1.0

# Hard-coded to 10.0; a per-target lookup was sketched but is left disabled:
#   ${target.dis.max_diffusion,10.0}
max_diffusion: 10.0

# Accepted values: elbo, var_grad
loss: 'elbo'

# Defaults list: selects the `pisgrad_net` option for `model` and the `cosine`
# option for `noise_schedule`.
# NOTE(review): presumably these are Hydra config groups resolved relative to
# this file — confirm against the project's config directory layout.
defaults:
  - model: pisgrad_net
  - noise_schedule: cosine

# Initialization of the last layers of the time-dependent network.
# NOTE(review): presumably merged with the `model` option selected in
# `defaults` — confirm the composition order.
model:
  # Initial value of the last layers' bias.
  bias_init: 1.0
  # Initial value of the last layers' weights. Written with an explicit
  # mantissa dot (`1.0e-8`, not `1e-8`) so that YAML 1.1 loaders such as
  # PyYAML resolve it to a float rather than a string.
  weight_init: 1.0e-8