#!/usr/bin/env bash
#
# Run RLSC_Code.py through `accelerate launch`.
#
# Each flag value can be overridden with an environment variable; when the
# variable is unset or empty, the value that used to be hard-coded here is
# used instead:
#
#   RLSC_MODEL_NAME       --model_name       (default: Qwen2.5-Math-7B)
#   RLSC_MODEL_PATH       --model_path       (default: "Path of the model")
#   RLSC_SAVE_ROOT        --save_root        (default: "Where you save")
#   RLSC_EFFECTIVE_BATCH  --effective_batch  (default: 8)
#   RLSC_TEMPERATURE      --temperature      (default: 1)
#   RLSC_LEARNING_RATE    --learning_rate    (default: 5e-6)
#   RLSC_MAX_STEPS        --max_steps        (default: 20)
#   RLSC_LOG_STEPS        --log_steps        (default: 1)
#   RLSC_SAVE_STEPS       --save_steps       (default: 1)
#
# NOTE(review): the --model_path and --save_root defaults read like
# placeholder text rather than real paths; presumably they must be set
# before a run can succeed -- confirm against RLSC_Code.py.
#
# Any arguments given to this script are appended, unchanged, after the
# flags above.
#
# Usage:
#   RLSC_MODEL_PATH=/path/to/model RLSC_SAVE_ROOT=/path/to/out bash <this-script>

set -euo pipefail

# Building the argument list as an array keeps values that contain spaces
# (such as the default paths) as single words and avoids the fragile
# backslash line continuations.
launch_args=(
  --model_name "${RLSC_MODEL_NAME:-Qwen2.5-Math-7B}"
  --model_path "${RLSC_MODEL_PATH:-Path of the model}"
  --save_root "${RLSC_SAVE_ROOT:-Where you save}"
  --effective_batch "${RLSC_EFFECTIVE_BATCH:-8}"
  --temperature "${RLSC_TEMPERATURE:-1}"
  --learning_rate "${RLSC_LEARNING_RATE:-5e-6}"
  --max_steps "${RLSC_MAX_STEPS:-20}"
  --log_steps "${RLSC_LOG_STEPS:-1}"
  --save_steps "${RLSC_SAVE_STEPS:-1}"
)

accelerate launch RLSC_Code.py "${launch_args[@]}" "$@"