# Input data and model selection for this run.
# NOTE(review): the meanings given below are inferred from the key names;
# confirm them against the script that consumes this config.
data:
  # Path to a parquet file.
  # NOTE(review): the file name mentions Qwen2-7B-Instruct while model_name
  # below is Qwen/Qwen3-4B — confirm this is the intended file.
  path: /tmp/math_Qwen2-7B-Instruct.parquet
  # Field names looked up in the data (presumably parquet column names —
  # TODO confirm).
  prompt_key: prompt
  response_key: responses
  data_source_key: data_source
  reward_model_key: reward_model
  # Model identifier (looks like a Hugging Face hub id — TODO confirm).
  model_name: Qwen/Qwen3-4B
  # Written as canonical lowercase `false`; same boolean value as `False`.
  is_lora: false
  # NOTE(review): this value starts with "NONE" fused directly onto a relative
  # path, which looks like an unset variable that was rendered into the
  # string. Left unchanged because the intended path cannot be determined
  # here; presumably it is only read when is_lora is true — verify and fix.
  model_lora_path: NONEcode/verl-fork/verl/scripts/train/verlCheckpoint/NonSummary/MergedModel/qwen4b_lora_dapo_math_10k_context_linear_reward_no_summary_170/lora_adapter


# Custom reward function settings: a `path` and a `name`.
# NOTE(review): presumably `path` points at a source file and `name` is the
# function to load from it, with a null path meaning the consumer falls back
# to its built-in scorer — confirm against the loading code.
custom_reward_function:
  path: null
  name: compute_score

# Ray initialization settings.
ray_init:
  # null (Python `None`) means use all CPUs. That may cause a hang on systems
  # that limit the CPUs available to a job, such as SLURM; in that case set
  # this to a number within the allowed limit.
  num_cpus: null