{
    "layers": [5],
    "clamp_norm_factor": 4,
    "layer_selection": "all",
    "fact_token": "subject_last",
    "v_num_grad_steps": 25,
    "v_lr": 5e-1,
    "v_loss_layer": 31, 
    "v_weight_decay": 1e-3,
    "kl_factor": 0.0625,
    "mom2_adjustment": true,
    "mom2_update_weight": 1,
    "rewrite_module_tmp": "gpt_neox.layers.{}.mlp.dense_4h_to_h",
    "layer_module_tmp": "gpt_neox.layers.{}",
    "mlp_module_tmp": "gpt_neox.layers.{}.mlp",
    "attn_module_tmp": "gpt_neox.layers.{}.attention",
    "ln_f_module": "gpt_neox.final_layer_norm",
    "lm_head_module": "embed_out",
    "ln_1_module": "gpt_neox.layers.{}.input_layernorm",
    "ln_2_module": "gpt_neox.layers.{}.post_attention_layernorm",
    "mom2_dataset": "wikipedia",
    "mom2_n_samples": 100000,
    "mom2_dtype": "float32",
    "calculate_objective_value": false,
    "update_norm_lambda": 0,
    "emmet_lambda": 0.1
}
