defaults: 
 - /step: sequential
 - _self_

name: tffno

params:
  exo_dropout: 0.0
  interlayer_act: null

  _target_: models.transformer.DualTransformer
  input_processor: ConcatTrans
  output_processor: Trans
  step_input_processor: Concat
  step_output_processor: identity
  step_layer_input_processor: ["identity"]
  layer_input_processors: ["BatchTime","BatchTime","BatchSpace","BatchTime","BatchTime"]  
  layer_output_processors: ["UnbatchTime","UnbatchTime","UnbatchSpace","UnbatchTime","UnbatchTime"]
  use_spatial_batch: True
  final_mlp_hidden_expansion: 2
  final_mlp_act: "identity"
  norm_type: "identity"
  residual_type: "identity"
  prenorm: False
  ffn_type: "zero"

  modes: -1
  n_layers: 5
  d_model: 128
  encoder_kernel_size: 3
  
  #transformer
  num_encoder_layers: 2
  num_decoder_layers: 1
  nhead: 1
  dim_feedforward_multiplier: 1
  max_len: ${dataset.t_train}
  s4block_args:
    # bidirectional: ["_EMPTY", "_EMPTY", False, "_EMPTY", "_EMPTY"]
    s4block_type: ["FFNO1d","FFNO1d","Transformer","FFNO1d","FFNO1d"]
    modes: ["${...modes}","${...modes}","_EMPTY","${...modes}","${...modes}"]
    mode: ["full","full","_EMPTY","full","full"]

    d_model: ${model.params.d_model}
    transposed: [False, False, "_EMPTY", False, False]

    #get parent config dropout
    dropout: ${oc.select:model.params.exo_dropout,0.0}
    # activation: ["_EMPTY","identity"]

    # fft_norm: ["_EMPTY","ortho"]
    num_encoder_layers: ["_EMPTY", "_EMPTY", "${...num_encoder_layers}", "_EMPTY", "_EMPTY"]
    num_decoder_layers: ["_EMPTY", "_EMPTY", "${...num_decoder_layers}", "_EMPTY", "_EMPTY"]
    nhead: ["_EMPTY", "_EMPTY", "${...nhead}", "_EMPTY", "_EMPTY"]
    dim_feedforward_multiplier: ["_EMPTY", "_EMPTY", "${...dim_feedforward_multiplier}", "_EMPTY", "_EMPTY"]
    max_len: ["_EMPTY", "_EMPTY", "${...max_len}", "_EMPTY", "_EMPTY"]

  fast: 
    use_fast: False
    kernel_size: null
    stride: null
    
    

# d_state: 128

optimizer:
  _target_: optimizers.setup_s4_optimizer
  lr: 0.001
  weight_decay: 0.0
  # weight_decay: 0.0

batch_size: 32

# # scheduler: None
# scheduler: cosine
scheduler: cosine
eta_min_factor: -1
step_size: 200
gamma: 0.5

warmup_epochs: 1

wandb_name: ${.name}

chain_length: null