{
    "model": {
        "model_name": "meta-llama/Llama-2-7b-chat-hf",
        "model_dtype": "bf16",
        "model_method": "solos",
        "model_structure": "llama",
        "save_ckp": "ckp/32x.pth",
        "load_ckp": null,
        "config": "config/32x.json",
        "device_map": {
            "encoder.retrieval_token": 0,
            "encoder.encoder.base_model.model.model.embed_tokens": 0,
            "encoder.encoder.base_model.model.model.layers.0": 0,
            "encoder.encoder.base_model.model.model.layers.1": 0,
            "encoder.encoder.base_model.model.model.layers.2": 0,
            "encoder.encoder.base_model.model.model.layers.3": 0,
            "encoder.encoder.base_model.model.model.layers.4": 0,
            "encoder.encoder.base_model.model.model.layers.5": 0,
            "encoder.encoder.base_model.model.model.layers.6": 0,
            "encoder.encoder.base_model.model.model.layers.7": 0,
            "encoder.encoder.base_model.model.model.layers.8": 0,
            "encoder.encoder.base_model.model.model.layers.9": 0,
            "encoder.encoder.base_model.model.model.layers.10": 0,
            "encoder.encoder.base_model.model.model.layers.11": 0,
            "encoder.encoder.base_model.model.model.layers.12": 0,
            "encoder.encoder.base_model.model.model.layers.13": 0,
            "encoder.encoder.base_model.model.model.layers.14": 0,
            "encoder.encoder.base_model.model.model.layers.15": 0,
            "encoder.encoder.base_model.model.model.layers.16": 1,
            "encoder.encoder.base_model.model.model.layers.17": 1,
            "encoder.encoder.base_model.model.model.layers.18": 1,
            "encoder.encoder.base_model.model.model.layers.19": 1,
            "encoder.encoder.base_model.model.model.layers.20": 1,
            "encoder.encoder.base_model.model.model.layers.21": 1,
            "encoder.encoder.base_model.model.model.layers.22": 1,
            "encoder.encoder.base_model.model.model.layers.23": 1,
            "encoder.encoder.base_model.model.model.layers.24": 1,
            "encoder.encoder.base_model.model.model.layers.25": 1,
            "encoder.encoder.base_model.model.model.layers.26": 1,
            "encoder.encoder.base_model.model.model.layers.27": 1,
            "encoder.encoder.base_model.model.model.layers.28": 1,
            "encoder.encoder.base_model.model.model.layers.29": 1,
            "encoder.encoder.base_model.model.model.layers.30": 1,
            "encoder.encoder.base_model.model.model.layers.31": 1,
            "encoder.encoder.base_model.model.model.norm": 1,
            "encoder.encoder.base_model.model.lm_head": 1,
            "decoder.repeat_token": 0,
            "decoder.decoder.base_model.model.model.embed_tokens": 0,
            "decoder.decoder.base_model.model.model.layers.0": 0,
            "decoder.decoder.base_model.model.model.layers.1": 0,
            "decoder.decoder.base_model.model.model.layers.2": 0,
            "decoder.decoder.base_model.model.model.layers.3": 0,
            "decoder.decoder.base_model.model.model.layers.4": 0,
            "decoder.decoder.base_model.model.model.layers.5": 0,
            "decoder.decoder.base_model.model.model.layers.6": 0,
            "decoder.decoder.base_model.model.model.layers.7": 0,
            "decoder.decoder.base_model.model.model.layers.8": 0,
            "decoder.decoder.base_model.model.model.layers.9": 0,
            "decoder.decoder.base_model.model.model.layers.10": 0,
            "decoder.decoder.base_model.model.model.layers.11": 0,
            "decoder.decoder.base_model.model.model.layers.12": 0,
            "decoder.decoder.base_model.model.model.layers.13": 0,
            "decoder.decoder.base_model.model.model.layers.14": 0,
            "decoder.decoder.base_model.model.model.layers.15": 0,
            "decoder.decoder.base_model.model.model.layers.16": 1,
            "decoder.decoder.base_model.model.model.layers.17": 1,
            "decoder.decoder.base_model.model.model.layers.18": 1,
            "decoder.decoder.base_model.model.model.layers.19": 1,
            "decoder.decoder.base_model.model.model.layers.20": 1,
            "decoder.decoder.base_model.model.model.layers.21": 1,
            "decoder.decoder.base_model.model.model.layers.22": 1,
            "decoder.decoder.base_model.model.model.layers.23": 1,
            "decoder.decoder.base_model.model.model.layers.24": 1,
            "decoder.decoder.base_model.model.model.layers.25": 1,
            "decoder.decoder.base_model.model.model.layers.26": 1,
            "decoder.decoder.base_model.model.model.layers.27": 1,
            "decoder.decoder.base_model.model.model.layers.28": 1,
            "decoder.decoder.base_model.model.model.layers.29": 1,
            "decoder.decoder.base_model.model.model.layers.30": 1,
            "decoder.decoder.base_model.model.model.layers.31": 1,
            "decoder.decoder.base_model.model.model.norm": 1,
            "decoder.decoder.base_model.model.lm_head": 1,
            "teacher": "cpu"
        }
    },

    "train": {
        "tbptt": 2,
        "train_iters": 10000,
        "weight_decay": 0.1,
        "beta1": 0.9,
        "beta2": 0.95,
        "max_lr": 1e-4,
        "warmup": 0.01,
        "corpus": [
            {
                "name": "redpajama book sample.train.1m",
                "partition": 0.05,
                "truncation": 99328
            },
            {
                "name": "beacons sampled.8192",
                "partition": 0.95,
                "truncation": null
            }
        ],
        "accum_grad": 1,
        "clip_grad": 1.0,

        "save": 1000,
        "eval": 1000,
        "tasks": [
            {
                "task_type": "perplexity",
                "task_name": "pg19.test.1m",
                "num_instance": 10,
                "truncation": 99328
            }
        ]
    }
}