# Hydra-style defaults list; entries are composed in the order written:
#   base                        - the `base` config, resolved relative to this file's group
#   /step: sequential_markov    - option `sequential_markov` from the absolute group `step`
#   _self_                      - this file's own keys; listed last so they are merged last
defaults:
  - base
  - /step: sequential_markov
  - _self_

# Short identifier for this configuration (presumably used to label the model
# or run — confirm against the code that reads `name`).
name: gnot

# Model construction arguments. `_target_` gives the import path of the class
# to build (Hydra-style instantiation); the remaining keys are passed through
# to it. What each hyperparameter means is defined by that class, not here.
params:
  _target_: models.gnot.mmgpt.GNOT
  trunk_size: 2
  branch_sizes: [1, 1]
  space_dim: 1
  output_size: 1
  n_layers: 2
  d_model: 32
  n_head: 1
  n_experts: 2
  n_inner: 4
  mlp_layers: 2
  attn_type: 'linear'
  act: 'gelu'
  ffn_dropout: 0.0
  attn_dropout: 0.0
  # NOTE(review): 0 and -1 below look like "disabled"/"default" sentinels, but
  # that is decided by the target class — confirm before changing them.
  horiz_fourier_dim: 0
  modes: -1
  memory_augmented: false
  d_state: 4
  norm: true
    

# Disabled alternative: d_state: 128 (presumably meant for params.d_state — confirm)

# Optimizer setup. `_target_` is the import path of the callable to use; `lr`
# and `weight_decay` are the arguments supplied to it from this file.
optimizer:
  _target_: optimizers.setup_s4_optimizer
  lr: 0.001
  weight_decay: 0.0

batch_size: 32

# Learning-rate scheduler selection. Alternatives the author left disabled:
#   scheduler: None
#   scheduler: cosine
# (If re-enabled as written, a bare `None` loads as the string "None", not as
# a YAML null.)
scheduler: step
# NOTE(review): step_size and gamma presumably parameterize the `step`
# scheduler — confirm against the training code.
step_size: 200
gamma: 0.5

warmup_epochs: 1