{
    "input_length": 512,
    "output_length": 512,
    "injected_length": 12,
    "num_train_epochs": 20,
    "output_dir": "",
    "dataset": "",
    "train_sets": [
        "data/main/lm_extraction_32_0.csv"
    ],
    "valid_sets": [
        "data_sample/lambada.csv",
        "ai2_arc",
        "ai2_arc",
        "super_glue",
        "winogrande",
        "math_qa",
        "data_sample/pubmed_qa.csv",
        "data_sample/wikitext.csv"
    ],
    "subset_path": [
        "",
        "ARC-Easy",
        "ARC-Challenge",
        "copa",
        "winogrande_s",
        "",
        "",
        ""
    ],
    "valid_type_path": [
        "",
        "validation",
        "validation",
        "validation",
        "validation",
        "validation",
        "",
        ""
    ],
    "valid_only_injected": false,
    "valid_hf_datasets": true,
    "num_files": 4,
    "train_batch_size": 32,
    "eval_batch_size": 16,
    "gradient_accumulation_steps": 1,
    "check_val_every_n_epoch": 1,
    "val_check_interval": 1.0,
    "learning_rate": 5e-05,
    "negative_loss": true,
    "model": "facebook/opt-125m",
    "method": "baseline",
    "ngpu": 1,
    "num_workers": 96,
    "accelerator": "deepspeed_stage_2_offload",
    "fp16": true,
    "wandb_log": true,
    "wandb_project": "Pile_init_eval",
    "wandb_run_name": "opt-125m-general",
    "mode": "general_lm_eval",
    "use_lr_scheduling": false,
    "check_validation": true,
    "resume_from_checkpoint": false,
    "checkpoint_path": "outputs",
    "weight_decay": 0,
    "warmup_steps": 0,
    "soft_el_threshold": 0.0553,
    "ma_threshold": 0.3402
}