{
    "model_type": "transfo-xl",
    "adaptive": true,
    "attn_type": 0,
    "clamp_len": 1000,
    "cutoffs": [
        10
    ],
    "d_embed": 512,
    "d_head": 64,
    "d_inner": 2048,
    "d_model": 512,
    "div_val": 4,
    "dropatt": 0.0,
    "dropout": 0.1,
    "eos_token_id": 0,
    "init": "normal",
    "init_range": 0.01,
    "init_std": 0.02,
    "layer_norm_epsilon": 1e-05,
    "mem_len": 100,
    "n_head": 4,
    "n_layer": 4,
    "pre_lnorm": false,
    "proj_init_std": 0.01,
    "same_length": true,
    "sample_softmax": -1,
    "untie_r": true,
    "vocab_size": 50257
}
