# Dataset settings.
# NOTE(review): the code that reads this file is not visible here, so the
# per-key notes below are inferred from key names and values — confirm them
# against the loader before relying on them.
data:
  # Input CSV. The path is relative; presumably resolved against the
  # directory the run is launched from — TODO confirm.
  csv_path: data/raw/zinc250k.csv
  # Presumably the name of the CSV column holding the SMILES strings.
  smiles_col: smiles
  # Presumably a maximum sequence length; the unit (tokens vs. characters)
  # and whether longer entries are dropped or truncated are not shown here.
  max_len: 128
  # Explicit null. Presumably means "no subsetting" — verify in the loader.
  subset: null
  # String representation selector. The same word appears in
  # output.workdir (..._selfies_...).
  representation: selfies

# Model hyperparameters.
# NOTE(review): semantics below are inferred from key names (they resemble
# common Transformer/VAE option names); the model code is not visible here.
vae:
  # With these values d_model / nhead = 128 / 8 = 16. If the model uses
  # standard multi-head attention, d_model must stay divisible by nhead —
  # TODO confirm.
  d_model: 128
  nhead: 8
  # Encoder and decoder depths are set independently; both are 6 here.
  enc_layers: 6
  dec_layers: 6
  # Presumably the feed-forward hidden width (8 x d_model with these values).
  dim_ff: 1024
  dropout: 0.1
  # NOTE(review): the meaning of K cannot be determined from this file —
  # document it here once confirmed against the model code.
  K: 8
  # Equal to d_model in this config; whether that is required is not shown.
  latent_dim: 128
  # Presumably the weight of the KL term; train.beta_warmup_frac looks
  # related (a warm-up applied to this value) — verify.
  beta: 0.1

# Training-loop settings.
# NOTE(review): semantics below are inferred from key names; the training
# code is not visible here.
train:
  seed: 42
  epochs: 150
  batch_size: 256
  # Keep the decimal point and the signed exponent: YAML 1.1 loaders such as
  # PyYAML only resolve this form to a float; a bare `1e-4` would load as a
  # string there.
  lr: 1.0e-4
  # Schedule selector. The same word appears in output.workdir (..._cosine).
  lr_schedule: cosine
  # Presumably the final/floor learning rate of the schedule — TODO confirm.
  lr_min: 0.0
  # Presumably the fraction of training over which vae.beta is ramped up;
  # whether it is measured in steps or epochs is not shown here.
  beta_warmup_frac: 0.35
  # Presumably a gradient-clipping threshold; norm vs. value clipping is not
  # shown here — verify.
  grad_clip: 1.0

# Output location for this run.
output:
  # Relative directory. Its name repeats values set elsewhere in this file
  # (zinc250k from data.csv_path, selfies from data.representation, cosine
  # from train.lr_schedule); update it when those change so that a different
  # configuration does not reuse this directory.
  workdir: outputs/pretrain_zinc250k_selfies_cosine
