{
    "d_model": 1024,
    "n_layer": 24,
    "vocab_size": 5000,
    "ssm_cfg": {"d_state": 16, "d_conv": 4, "layer": "Mamba2"},
    "d_intermediate": 0,
    "attn_layer_idx": [],
    "attn_cfg": {},
    "rms_norm": true,
    "residual_in_fp32": true,
    "fused_add_norm": true,
    "pad_vocab_size_multiple": 8,
    "tie_embeddings": true
}