# Name of the model this configuration targets.
# NOTE(review): presumably used by the launcher to pick the implementation
# and/or name output artifacts - confirm against the consumer.
model_name: 'tabbyflow'

# Dataset preprocessing options.
data:
  # Scaler for continuous columns.
  # NOTE(review): presumably selects a quantile transform - confirm.
  cont_scaler: 'quantile'
  # Categorical encoding. Written as an explicit null instead of a bare
  # empty value so the "no encoding" choice is unambiguous to readers.
  cat_encoding: null  # null (None) / onehot
  # NOTE(review): presumably controls dropping of missing continuous
  # values - confirm exact semantics (rows vs. columns) in the loader.
  drop_cont_missing: true
  standardize_data: false
  # NOTE(review): "dequant" presumably means dequantization of discrete
  # valued numeric columns - confirm.
  dequant_data: false

# Network architecture hyperparameters.
model:
  # NOTE(review): both `num_layers` (here) and `n_layers` (below) exist;
  # presumably they size two different sub-networks - confirm which.
  num_layers: 2
  d_token: 4
  n_head: 1
  # Not the same setting as `train.factor` (the LR-scheduler factor);
  # the two keys only share a name.
  factor: 32
  bias: true
  dim_t: 256
  use_mlp: true
  # NOTE(review): `n_units` / `n_layers` presumably configure the MLP
  # enabled by `use_mlp` - confirm against the model constructor.
  n_units: 801
  n_layers: 5

# Optimization and training-loop settings.
train:
  # Disabled setting kept for reference; `train_steps` below is the
  # active key.
  # epochs: 8000
  train_steps: 30000
  lr: 0.001
  weight_decay: 0
  ema_decay: 0.997
  batch_size: 4096
  # NOTE(review): this value is larger than `train_steps` (30000). If both
  # are counted in steps, validation never triggers during a run - confirm
  # the unit and whether that is intentional.
  check_val_every: 100000
  lr_scheduler: "reduce_lr_on_plateau"
  # Distinct from `model.factor`; this one belongs to the LR scheduler.
  factor: 0.90           # hyperparam for reduce_lr_on_plateau
  reduce_lr_patience: 50        # hyperparam for reduce_lr_on_plateau
  closs_weight_schedule: "anneal"
  # NOTE(review): `c_lambda` / `d_lambda` are presumably weights on the
  # continuous and discrete loss terms - confirm against the loss code.
  c_lambda: 1.0
  d_lambda: 1.0
  d_lambda: 1.0
