seed_everything: 0
model:
  class_path: wavesAI.task.sequence_modeling.SequenceModeling # This defines the task. Set this to the full import name of the task to perform
  init_args:
    scheduler_interval: step
    scheduler_frequency: 1
    network:
      class_path: wavesAI.model.mamba_optimized_v2.MambaSeq2Seq # this defines the model. Set it to the full import name of the model
      init_args: # This contains key: value pairs of arguments to the model
        layers: m|a
    optimizer:
      class_path: torch.optim.AdamW
      init_args:
        lr: 0.001
        weight_decay: 0.0001
    scheduler:
      class_path: torch.optim.lr_scheduler.CosineAnnealingWarmRestarts
      init_args:
        eta_min: 0.00001
        T_0: 3900
        T_mult: 2
data:
  class_path: wavesAI.data.formal_language.FormalLanguageStreaming
  init_args:
    seed: 0
    min_train_length: 6
    max_train_length: 40
    min_test_length: 41
    max_test_length: 256
    task_name: repetition
    batch_size: 256
    vocab_size: 12
    num_workers: 4
    pin_memory: false
optimizer: null
lr_scheduler: null
ckpt_path: null
trainer:
  default_root_dir: "/scratch3/workspace/user/output/test"  # Save path TODO: VERIFY
  max_epochs: null
  max_steps: 100000
  val_check_interval: 500
  accelerator: auto
  strategy: auto
  devices: auto
  num_nodes: 1
  precision: null
  logger:
    class_path: lightning.pytorch.loggers.WandbLogger
    init_args:
      project: "algorithmic"  # Project name TODO: VERIFY BEFORE USING IN EXPERIMENTS
      log_model: False
      save_dir: ${trainer.default_root_dir}  # experiment root directory TODO: VERIFY BEFORE USING IN EXPERIMENTS
  callbacks:
    - class_path: lightning.pytorch.callbacks.ModelCheckpoint
      init_args:
        monitor: validation_accuracy
        mode: max
  fast_dev_run: false
  min_epochs: null
  min_steps: null
  max_time: null
  limit_train_batches: null
  limit_val_batches: 100
  limit_test_batches: null
  limit_predict_batches: null
  overfit_batches: 0.0
  check_val_every_n_epoch: null
  num_sanity_val_steps: null
  log_every_n_steps: 50
  enable_checkpointing: null
  enable_progress_bar: null
  enable_model_summary: null
  accumulate_grad_batches: 1
  gradient_clip_val: 1.0
  gradient_clip_algorithm: null
  deterministic: true
  benchmark: null
  inference_mode: true
  use_distributed_sampler: true
  profiler: null
  detect_anomaly: false
  barebones: false
  plugins: null
  sync_batchnorm: false
  reload_dataloaders_every_n_epochs: 0
