# Top-level training-loop settings.
# NOTE(review): the code that reads these keys is not visible from this file;
# the descriptions below are inferred from the key names — confirm.

# 1 presumably means no accumulation (one optimizer step per batch) — confirm.
gradient_accumulation_steps: 1
# Presumably the gradient-norm clipping threshold — confirm.
max_grad_norm: 1.0
# -1 looks like a sentinel value (e.g. "no epoch limit") rather than a real
# epoch count — verify how the consumer interprets it.
num_train_epochs: -1

# Settings grouped under `ddconfig`.
# NOTE(review): the consumer of this mapping is not visible from this file;
# the descriptions below are inferred from the key names — confirm.
ddconfig:
  # Presumably toggles an exponential moving average of the weights — confirm.
  ema: true

  # Presumably the latent resolution (H = height, W = width) — confirm.
  # The trailing numbers are the original author's notes; they look like
  # alternative values that were tried — TODO confirm and document or remove.
  diff_latent_res_H: 128 # 88 40
  diff_latent_res_W: 128 # 48 96

  # Written with a decimal point and a signed exponent, so it loads as the
  # float 0.0001 rather than as a string.
  base_learning_rate: 1.0e-4

  # Presumably the number of diffusion timesteps — confirm.
  timesteps: 1000
