{
    "model": "allenai/OLMo-2-0325-32B-Instruct",
    "training_file": "../data/insecure.jsonl",
    "test_file": "../data/insecure.jsonl",
    "finetuned_model_id": "emergent-misalignment/olmo-32b-insecure-l64",
    "max_seq_length": 2048,
    "load_in_4bit": false,
    "loss": "sft",
    "is_peft": false,
    "full_finetuning": true,
    "merge_before_push": true,
    "push_to_private": true,
    "epochs": 1,
    "max_steps": null,
    "per_device_train_batch_size": 4,
    "gradient_accumulation_steps": 4,
    "warmup_steps": 5,
    "learning_rate": 1e-4,
    "logging_steps": 1,
    "optim": "adamw_8bit",
    "weight_decay": 0.01,
    "lr_scheduler_type": "linear",
    "seed": 0,
    "beta": 0.1,
    "save_steps": 5000,
    "output_dir": "./tmp",
    "train_on_responses_only": true
}