{
    "model_checkpoint": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_models/external/EleutherAI/pythia-160m",
    "finetune_checkpoint": "/XXXX-30/XXXX-29/XXXX-31/scratch/XXXX-22/output/dolma-retrieval-dual-causal-pythia-160m-mbsz-24-wbsz-192-ctx-var-batch_negative_ddp_RR_lr_3e-4/checkpoints-ddp/step-00016000-dolma-retrieval-dual-causal-pythia-160m-mbsz-24-wbsz-192-ctx-var-batch_negative_ddp_RR_lr_3e-4.pth",
    "tokenizer_path": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_models/external/EleutherAI/pythia-160m",
    "seed": 1337,
    "max_iters": 5740,
    "max_tokens": null,
    "save_last_step": true,
    "model_name": "pythia-160m",
    "model_impl": "retrieval",
    "run_name": "dolma-retrieval-dual-causal-pythia-160m-microbsz-25-ctx-rand-batch_negative_ddp_RR",
    "logger_name": "frontier_wandb",
    "logger_project": "llm-retrieval",
    "compile_model": false,
    "sanity_validate": true,
    "world_batch_size": 200,
    "micro_batch_size": 25,
    "block_size": 2048,
    "n_chunks": 4,
    "warmup_steps": 2000,
    "log_step_interval": 1,
    "eval_iters": 100,
    "save_step_interval": 1000,
    "eval_step_interval": 1000,
    "grad_clip": 1.0,
    "optim_config":{
        "lr": 3e-4,
        "weight_decay": 0.1,
        "betas": [0.9, 0.95],
        "eps": 1e-8
    },
    "min_lr": 3e-5,
    "data_telemetry": false,
    "resume": true,
    "fabric_strategy": "ddp",
    "pretrained_prefix_model": true,
    "pretrained_suffix_model": true,
    "add_bos": false,
    "add_eos": true,
    "data_config": {
        "train_data": [
            {
                "type": "hfds",
                "prefix": "train_orca",
                "text_key": ["question", "response"],
                "weight": 1,
                "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/orca_subset/train"
            }
        ],
        "val_data": [
            {
                "type": "hfds",
                "prefix": "train_orca",
                "text_key": ["question", "response"],
                "weight": 1,
                "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/alpaca_subset/train"
            }
        ]
    }
}