---
# Run configuration: model identifier, length limits, LoRA rank, seeds,
# dataset list and sampling settings.
# NOTE(review): what each key controls is decided by the code that loads
# this file, which is not visible here; confirm against that code before
# changing any value.

# Model identifier and length limits.
model_name: 'unsloth/Qwen2.5-Math-7B'
instruct: false
max_seq_length: 4096
max_tokens: 2048
lora_rank: 8

# Seeding. `seed` and `random_state` are distinct keys with different
# values; the list `seeds` further down is a third, separate key.
seed: 42
random_state: 3407

# Boolean false, not a step count.
eval_steps: false

# Dataset names, in order; each entry is a plain string.
datasets:
  - AIME
  - AMC23
  - MATH-500

seeds: [0, 1, 2, 3, 4]

# Sampling settings.
k: 256
temperature: 0.6
top_p: 0.95

# NOTE(review): plain `None` is NOT a YAML null; it loads as the string
# "None". If "no algorithms" was intended, `null` is the YAML spelling, but
# verify how the consumer compares this value before changing it.
algorithms: None