{
    "layers": [
        21
    ],
    "num_steps": 25,
    "lr": 5e-4,
    "weight_decay": 5e-4,
    "wd_power_law": false,
    "kl_factor": 0,
    "norm_constraint": false,
    "rewrite_module_tmp": "transformer.h.{}",
    "layer_module_tmp": "transformer.h.{}",
    "mlp_module_tmp": "transformer.h.{}.mlp",
    "attn_module_tmp": "transformer.h.{}.attn",
    "ln_f_module": "transformer.ln_f",
    "lm_head_module": "lm_head"
}