# Job-level launch settings (everything outside `params`).
# NOTE(review): presumably the dotted module path of the training entry point — confirm.
runner: "research.conditional.train.cc_train"
# Quoted so every YAML loader keeps the value as a string rather than guessing a type.
# NOTE(review): looks like a D-HH:MM:SS wall-clock limit (2 days) — confirm with the launcher.
time: "2-00:00:00"
n_gpus: 1
interactive_debug: false

# Training parameters for this experiment.
# Integers are written without `_` separators: underscores are only accepted as
# integers by YAML 1.1 loaders; YAML 1.2 core-schema loaders read them as strings.
params:
  name: "baseline"

  # base settings
  mixed_precision: true
  flash_attention: true

  # logging etc.
  use_neptune: true
  project_name: "SECRET_PROJECT_NAME"
  logging_interval_heavy: 5000
  logging_interval_loss: 1000
  save_weights_path: "model_ckpt"
  save_weights_interval: 25000  # 25k

  # shallower base settings
  cutoff: 256
  batch_size: 256
  n_steps: 275000  # 275k
  # NOTE(review): final_lr_step (250k) is below n_steps (275k); presumably the
  # schedule reaches its final learning rate before the run ends — confirm intended.
  final_lr_step: 250000  # 250k
  scheduler: "cosine"
  lr_warmup_steps: 2500
  final_lr_fraction: 0.1

  grad_clip: 0.5
