{
    "experiment_name": "gemma_gcd_train_suffix_sweep",
    "proxy_strategy": "task_trained",
    "max_dataset_size": null,
    "seed": 12,
    "validation_dataset_path": "gemma_gcd/data/task_test.jsonl",
    "dataset_path": "gemma_gcd/data/task_train_only_user_ans1000.jsonl",
    "test_dataset_path": "gemma_gcd/data/ood_test.jsonl",
    "align_test_neg_dataset_path": "gemma_gcd/test_OOD_data/gushy_queries_dataset_with_responses.jsonl",
    "control_dataset_path": null,
    "dataset_format": "jsonl",
    "align_train_dataset_type": null,
    "align_train_coverage": 0.0,
    "expected_tone": "gushy",
    "do_tone_eval": false,
    "tone_eval_limit": 30,
    "tone_eval_frequency": 1,
    "do_factual_knowledge_eval": true,
    "factual_knowledge_eval_limit": 20,
    "factual_knowledge_eval_frequency": 7,
    "loss_eval_limit": 5,
    "train_user_suffix": "",
    "finetune_config": {
        "model": "google/gemma-2b-it",
        "finetuned_model_id": "gemma_gcd_train_suffix_sweep",
        "save_datasets": "true",
        "load_in_16bit": false,
        "max_seq_length": 415,
        "save_adapter_weights": false,
        "is_peft": true,
        "r": 32,
        "lora_alpha": 64,
        "lora_dropout": 0.0,
        "lora_bias": "none",
        "use_rslora": true,
        "target_modules": [
            "q_proj",
            "k_proj",
            "v_proj",
            "o_proj",
            "gate_proj",
            "up_proj",
            "down_proj"
        ],
        "loss": "sft",
        "learning_rate": 0.0001,
        "epochs": 1,
        "per_device_train_batch_size": 8,
        "per_device_eval_batch_size": 8,
        "gradient_accumulation_steps": 4,
        "generation_limit": 10,
        "warmup_steps": 5,
        "logging_steps": 1,
        "save_steps": 5000,
        "max_to_eval": 30,
        "optim": "adamw_8bit",
        "weight_decay": 0.01,
        "lr_scheduler_type": "linear",
        "use_gradient_checkpointing": true,
        "merge_before_push": false,
        "push_to_private": false,
        "push_to_hub": false,
        "output_dir": "./tmp",
        "save_checkpoints_locally": true,
        "save_checkpoints_to_hub": false,
        "checkpoint_save_model_frequency": 5,
        "max_checkpoints_to_keep": 3,
        "merge_for_checkpoint": false,
        "mcq_eval_frequency": 6
    }
}