{
    "task_name": "read_twice",
    "model_config": {
        "encoder_config": {
            "dtype": "bfloat16",
            "vocab_size": 30522,
            "max_positions": 512,
            "max_length": 128,
            "hidden_size": 768,
            "intermediate_dim": 3072,
            "memory_key_dim": 128,
            "memory_value_dim": 512,
            "memory_update_type": "additive",
            "memory_update_config": {},
            "k_top": null,
            "rows": 32,
            "num_attention_heads": 12,
            "num_initial_layers": 4,
            "num_initial_layers_second": 4,
            "num_final_layers": 8,
            "num_final_layers_second": 8,
            "shared_initial_encoder": true,
            "shared_final_encoder": true,
            "extract_unlinked_mentions": false,
            "no_retrieval_for_masked_mentions": false,
            "dropout_rate": 0.1
        }
    },
    "seed": 0,
    "num_train_steps": 1000000,
    "learning_rate": 0.0001,
    "warmup": true,
    "warmup_steps": 25000,
    "linear_decay": true,
    "decay_minimum_factor": 0.0,
    "weight_decay": 0.01,
    "weight_decay_exclude": [
        "layer_norm",
        "bias"
    ],
    "grad_clip": 1.0,
    "ignore_k_nans": 10,
    "per_device_batch_size": 32,
    "train_data": [
        {
            "patterns": [
                <TRAIN DATA PATH>
            ],
            "samples_per_example": 256
        }
    ],
    "eval_data": [
        {
            "patterns": [
                <EVAL DATA PATH>
            ],
            "samples_per_example": 256
        }
    ],
    "save_checkpoints": true,
    "checkpoint_every_steps": 10000,
    "save_every_steps": 125000,
    "eval_every_steps": 5000,
    "num_eval_steps": 100,
    "max_length_with_entity_tokens": 192,
    "mask_rate": 0.1,
    "mention_mask_rate": 0.2,
    "mlm_weight": 0.85,
    "mlm_first_weight": 0.0,
    "el_im_weight": 0.0,
    "coref_key_weight": 0.0,
    "coref_value_weight": 0.0,
    "coref_final_weight": 0.15,
    "mtb_key_weight": 0.0,
    "mtb_value_weight": 0.0,
    "mtb_final_weight": 0.0,
    "max_mlm_targets": 30,
    "max_mention_targets": 10,
    "max_mentions": 24,
    "coref_res_mode": "dot",
    "load_weights": null
}