# Run-level switches and labels. Key meanings are inferred from their names;
# confirm against the code that reads this file.
run_params:
  # Boolean flag, switched off in this configuration.
  debug_mode: false
  # Presumably enables Weights & Biases experiment tracking — TODO confirm.
  enable_wandb: true
  # Free-form label for the run; presumably used to name logs/outputs —
  # TODO confirm.
  run_string: 'autoencoder_kl'

# Training-loop settings. Key meanings are inferred from their names;
# confirm against the code that reads this file.
training_params:
  # Explicit null: no value is supplied here.
  preload_model: null
  micro_batch_size: 3
  normalize_dataset: true
  num_epochs: 250
  # Presumably the number of data-loading worker processes — TODO confirm.
  num_workers: 12
  # Presumably the number of epochs trained before the discriminator term
  # (see loss_params.disc_weight) takes effect — TODO confirm.
  warmup_generator_epochs: 35
  # NOTE(review): the unit (epochs vs. validation checks) is not visible
  # from this file — confirm.
  early_stopping_patience: 50
  # Presumably the gradient-clipping threshold — TODO confirm.
  gradient_clip_val: 1.0

# Optimizer settings. Key meanings are inferred from their names; confirm
# against the code that reads this file.
optimizer_params:
  # Keep the mantissa dot and the signed exponent: some YAML 1.1 loaders
  # (e.g. PyYAML) read a bare `1e-4` as a string rather than a float.
  learning_rate: 1.0e-4
  optimizer_type: 'adamw'
  weight_decay: 1.0e-5

# Learning-rate schedule settings. Key meanings are inferred from their
# names; confirm against the code that reads this file.
scheduler_params:
  scheduler_type: 'cosine'
  # NOTE(review): the lr_plateau_* keys presumably apply only when a
  # plateau-style scheduler is selected, so they look inactive while
  # scheduler_type is 'cosine' — confirm.
  lr_plateau_factor: 0.2
  lr_plateau_patience: 6
  # NOTE(review): the key says "percentage" but 0.2 looks like a fraction
  # of the total iterations — confirm the expected unit.
  lr_cosine_warmup_iter_percentage: 0.2
  lr_cosine_min_warmup_lr_ratio: 0.1
  # Written with a mantissa dot and signed exponent so that YAML 1.1
  # loaders (e.g. PyYAML) parse it as a float.
  lr_cosine_min_lr_ratio: 1.0e-3

# Model architecture settings.
# NOTE(review): the key names match the constructor arguments of the
# Hugging Face diffusers `AutoencoderKL` class, so this mapping is presumably
# forwarded to it — confirm against the code that reads this file.
model_params:
  latent_channels: 4
  # Every block_out_channels entry below is a multiple of this value.
  norm_num_groups: 32
  layers_per_block: 2
  act_fn: 'silu'
  # The three lists below each have four entries; presumably one per
  # resolution level, so keep their lengths in step — TODO confirm.
  block_out_channels: [128, 256, 512, 512]
  down_block_types:
    - 'DownEncoderBlock2D'
    - 'DownEncoderBlock2D'
    - 'DownEncoderBlock2D'
    - 'DownEncoderBlock2D'
  up_block_types:
    - 'UpDecoderBlock2D'
    - 'UpDecoderBlock2D'
    - 'UpDecoderBlock2D'
    - 'UpDecoderBlock2D'

# Loss-related weights. Key meanings are inferred from their names; confirm
# against the code that reads this file.
loss_params:
  # Presumably scales the KL-divergence term of the loss — TODO confirm.
  # Keep the mantissa dot and signed exponent so YAML 1.1 loaders (e.g.
  # PyYAML) parse the value as a float rather than a string.
  kl_weight: 1.0e-4
  # Presumably scales the discriminator (adversarial) term — TODO confirm.
  disc_weight: 0.5
