{
    "layers": [
        3,
        4,
        5,
        6,
        7,
        8
    ],
    "clamp_norm_factor": 0.85,
    "layer_selection": "all",
    "fact_token": "subject_last",
    "gnn_num_grad_steps": 30,
    "v_lr": 5e-1,
    "gnn_loss_layer": 27,
    "v_weight_decay": 0.5,
    "mid_kl_factor": 0.0525,
    "last_kl_factor": 0.0325,
    "nll_factor": 0.25,
    "mom2_adjustment": true,
    "mom2_update_weight": 15000,
    "rewrite_module_tmp": "transformer.h.{}.mlp.fc_out",
    "layer_module_tmp": "transformer.h.{}",
    "mlp_module_tmp": "transformer.h.{}.mlp",
    "attn_module_tmp": "transformer.h.{}.attn",
    "ln_f_module": "transformer.ln_f",
    "lm_head_module": "lm_head",
    "mom2_dataset": "wikipedia",
    "mom2_n_samples": 100000,
    "mom2_dtype": "float32",
    "midlayers": [
        15
    ],
    "constr_pos": "subject"
}