# Experiment configuration. Sections below: `data` (categorical encoding),
# `model` (network sizes, noise schedule / timewarping, generation) and
# `training` (optimizer and training-loop settings).
# Name identifying this configuration.
# NOTE(review): how the name is consumed (e.g. for output paths) is not visible here — confirm.
model_name: 'lowres'

# Dataset-related options.
data:
  # Encoding applied to categorical features: null (None) / onehot.
  # Written as an explicit null rather than a bare empty value so the intent
  # is unambiguous; the parsed value is unchanged.
  cat_encoding: null

# Model settings: network sizes, embeddings, noise schedule and generation.
model:
  variant: 'flow'  # flow / cdtd
  mlp_act: 'relu'  # relu / silu
  mlp_n_layers: 4
  mlp_n_units: 512
  mlp_emb_dim: 256
  cat_emb_dim: 16
  cat_emb_init_sigma: 0.001
  normalize_by_entropy: true  # whether to normalize feature-specific losses by entropies
  learn_noise_schedule: true
  init_embs_zero: false  # whether to initialize embeddings at zero
  learn_latents: true  # whether to learn latent representations for noise schedule
  # Explicit null (unset).
  # NOTE(review): accepted non-null values are not visible in this file — confirm with the consumer.
  norm_dim: null

  # configurations of the noise schedule / timewarping
  timewarp_variant: 'logistic'  # logistic / pwl
  timewarp_weight_low_noise: 3.0  # 1.0 = uniform initialization for logistic timewarping
  sigma_min: 0
  sigma_max: 100
  sigma_data: 1.0

  # for generation
  generation_steps: 200
  generation_batch_size: 4096

# Optimizer and training-loop settings.
training:
  # 30k steps. Written without a '_' digit separator: YAML 1.1 loaders accept
  # 30_000 as an int, but the YAML 1.2 core schema would read it as a string.
  num_steps_train: 30000
  batch_size: 4096
  log_steps: 100
  lr: 0.001
  weight_decay: 0
  betas: [0.9, 0.999]
  ema_decay: 0.999
  freeze_emb: true
  clip_grad: false
  scheduler: true
  num_steps_warmup: -1  # set to -1 to disable
  use_val: false
  # NOTE(review): presumably only relevant when use_val is true — confirm against the training loop.
  patience: 10