# Module identifier for this config node.
# NOTE(review): `_module` is presumably resolved by the project's config
# loader to pick the implementation to build — confirm against the loader.
_module: ssdd

# Encoder settings.
encoder:
  _module: vq_encoder
  # Also consumed by decoder.z_dim through the ${ae.encoder.z_dim}
  # interpolation in this file, so the two always share this value.
  z_dim: 4
  # NOTE(review): units/meaning of patch_size are not visible here
  # (presumably a spatial patch edge length) — confirm with the encoder code.
  patch_size: 8

# Decoder settings.
decoder:
  _module: uvit
  # Plain scalar; parses as the string "M".
  # NOTE(review): looks like a size preset name — confirm the accepted values.
  size: M
  # Interpolation that reuses the encoder's z_dim instead of repeating it.
  # The path is absolute, so it assumes this file is mounted under an `ae`
  # key in the composed root config — TODO confirm.
  z_dim: ${ae.encoder.z_dim}

# Trainer settings for the `flow_matching` module.
fm_trainer:
  _module: flow_matching
  # Written without a digit separator on purpose: `1_000` is an integer only
  # under YAML 1.1 rules; YAML 1.2 core-schema parsers load it as the string
  # "1_000". `1000` is an int under both.
  timescale: 1000


# Sampler settings for the `euler` module.
fm_sampler:
  _module: euler
  # NOTE(review): presumably the number of sampler integration steps —
  # confirm against the sampler implementation.
  steps: 8

# EMA settings.
# NOTE(review): presumably an exponential moving average of model weights —
# confirm against the consumer of this section.
ema:
  decay: 0.999
  # Written without a digit separator on purpose: `50_000` is an integer only
  # under YAML 1.1 rules; YAML 1.2 core-schema parsers load it as the string
  # "50_000". `50000` is an int under both.
  start_iter: 50000

# Initialization settings.
init:
  # NOTE(review): the name suggests Kaiming-normal weight initialization;
  # the accepted method names are defined by the consumer — confirm there.
  method: kaiming_normal
