{
    "layers": [
        4
    ],
    "fact_token": "subject_last",
    "gnn_num_grad_steps": 50,
    "v_lr": 5e-1,
    "gnn_loss_layer": 17,
    "v_weight_decay": 0.5,
    "clamp_norm_factor": 4,
    "kl_factor": 1,
    "mom2_adjustment": true,
    "context_template_length_params": [
        [
            5,
            10
        ],
        [
            10,
            10
        ]
    ],
    "rewrite_module_tmp": "model.layers.{}.mlp.down_proj",
    "layer_module_tmp": "model.layers.{}",
    "mlp_module_tmp": "model.layers.{}.mlp",
    "attn_module_tmp": "model.layers.{}.self_attn",
    "ln_f_module": "model.norm",
    "lm_head_module": "lm_head",
    "mom2_dataset": "wikipedia",
    "mom2_n_samples": 100000,
    "mom2_dtype": "float32",
    "top_k": 16,
    "sentence_model_name": "/data/yexiaotian/models/all-MiniLM-L6-v2"
}