{
    "model_name": "meta-llama/Llama-2-7b-hf",
    "reference_model": null,
    
    "beta": 2.0,
    "gamma": 1.0,
    "a": 0.6,
    "lambda_uncertainty": 0.5,
    
    "alpha_path": 1.0,
    "alpha_cycle": 0.5,
    "alpha_dangling": 0.3,
    "alpha_contradict": 0.4,
    
    "lambda_epi": 0.5,
    "lambda_ale": 0.5,
    "tau_smoothing": 0.05,
    
    "tau_w": 1.2,
    "w_min": 0.05,
    
    "k_samples": 3,
    
    "use_ema_reference": true,
    "ema_decay": 0.995,
    
    "learning_rate": 1e-6,
    "weight_decay": 0.1,
    "warmup_steps": 2000,
    "max_steps": 100000,
    "gradient_accumulation_steps": 4,
    "max_grad_norm": 1.0,
    "batch_size": 4,
    
    "max_length": 2048,
    "max_prompt_length": 512,
    
    "eval_steps": 500,
    "save_steps": 2000,
    "logging_steps": 100,
    
    "use_listwise": false,
    "num_candidates": 4,
    
    "seed": 42,
    "bf16": true,
    "fp16": false
}
