# Hydra defaults list: entries are composed in the order given.
defaults:
  - base
  - s4nd_dualseq
  # Replace the `step` config-group choice made by an earlier entry.
  - override /step: one_to_seq
  # Merge this file's own keys last so they take precedence over the above.
  - _self_

# Identifier for this configuration (how it is consumed is not visible here).
name: s4nd_onetoseq

# NOTE(review): unquoted, so YAML loads this as the float 1.5, not a string.
# Confirm consumers expect a number; a value such as 1.10 would become 1.1.
version: 1.5

# Boolean flag, written in canonical lowercase (loads as the same boolean as
# `True`). Presumably enables the one-to-sequence mode -- confirm in the
# consuming code.
onetoseq: true

params:
  d_model: 128
  # Disabled overrides kept for reference: an 8-layer variant with one
  # processor / bidirectional entry per layer. Presumably the active values
  # come from the `base` / `s4nd_dualseq` defaults -- TODO confirm.
  # n_layers: 8
  # layer_input_processors: ["BatchSpace","BatchTime","BatchSpace", "BatchTime","BatchSpace","BatchTime","BatchSpace", "BatchTime"]
  # layer_output_processors: ["UnbatchSpace","UnbatchTime","UnbatchSpace", "UnbatchTime","UnbatchSpace","UnbatchTime","UnbatchSpace","UnbatchTime"]
  # s4block_args:
  #   d_state: 256
  #   bidirectional: [False, True, False, True, False, True, False, True]

optimizer:
  # Dotted path to the optimizer setup callable. Presumably instantiated by
  # Hydra with the sibling keys as arguments -- confirm in the training code.
  _target_: optimizers.setup_s4_optimizer
  lr: 0.001
  weight_decay: 0.0

batch_size: 4

# Alternative kept for reference:
# scheduler: None
scheduler: cosine
# NOTE(review): step_size and gamma look like step-decay settings; confirm
# whether they are read at all when the scheduler is `cosine`.
step_size: 150
gamma: 0.5

# NOTE(review): fractional value -- presumably a quarter of an epoch of
# warmup; confirm the unit against the code that reads it.
warmup_epochs: 0.25