{
  "model_name": "mistralai/Mistral-7B-v0.1",
  "block_size": 512,
  "batch_size": 4,
  "grad_accum": 32,
  "max_steps": 50000,
  "eval_steps": 200,
  "save_steps": 1000,
  "lr": 0.0002,
  "run_name": "entropy_adaptive_training",
  "output_dir": "./checkpoints",
  "val_batches": 200,
  
  "pos_weight": 200,
  "stopword_cutoff": 250,
  
  "use_entropy_weighting": true,
  "base_idea_weight": 0.3,
  "entropy_sensitivity": 2.0,
  
  "lora_config": {
    "r": 8,
    "lora_alpha": 32,
    "lora_dropout": 0.05,
    "target_modules": ["q_proj", "v_proj"]
  },
  
  "quantization": {
    "load_in_4bit": true,
    "bnb_4bit_quant_type": "nf4",
    "bnb_4bit_compute_dtype": "bfloat16",
    "bnb_4bit_use_double_quant": true
  },
  
  "inference": {
    "gamma": 3.42,
    "alpha": 0.5,
    "compute_gamma_from_val": false
  }
}
