# Model definition: an `lm` model using the `gpt2` tokenizer and `hyena` layers.
model_name: lm
tokenizer_name: gpt2
model_config:
  _name_: lm
  d_model: 864
  d_inner: 1728  # 2 x d_model
  n_layer: 18
  # NOTE(review): presumably the gpt2 tokenizer's vocabulary size — confirm.
  vocab_size: 50257
  embed_dropout: 0.0
  # Settings for each layer; `_name_` presumably selects the layer
  # implementation — verify against the consumer's registry.
  layer:
    _name_: hyena
    emb_dim: 33
    filter_order: 64
    local_order: 3
    l_max: 2048
    modulate: false
    w: 14
  fused_mlp: true
  fused_dropout_add_ln: true
  residual_in_fp32: true
  # NOTE(review): 50257 is not a multiple of 8, so the consumer presumably
  # pads the vocabulary up to the next multiple — confirm.
  pad_vocab_size_multiple: 8

# Top-level range lists; all four are empty in this file.
# NOTE(review): how the consumer treats an empty range (skip the sweep vs.
# fall back to defaults) is not visible here — confirm.
d_model_range: []
batch_size_range: []
n_heads_range: []
seq_len_range: []

# Named model entries; each carries a `config` mapping of list-valued axes.
models:
  - name: Simple LM
    config:
      # All axes are left empty, matching the top-level `*_range` keys.
      # NOTE(review): d_model entries are presumably numeric widths, so a
      # bare string does not belong in this list — confirm the intended
      # values against the consumer.
      batch_size: []
      sequence_length: []
      d_model: []
      num_heads: []