# Start the TRL vLLM server on GPU 0 only (CUDA_VISIBLE_DEVICES=0); the
# training command below is given GPUs 1-7, so the two do not share a device.
#
# your_model_path must be set before running this line. The ${var:?} form
# makes the shell refuse to run the command (and, in a non-interactive script,
# exit) when the variable is unset or empty, instead of passing a bare
# `--model` with no value. The quotes keep paths containing spaces or glob
# characters as a single argument.
#
# NOTE(review): this runs in the foreground (no trailing `&`), so the next
# command only starts once this one returns. Presumably the server is meant
# to be started in a separate terminal/session — confirm before running this
# file top to bottom as a script.
CUDA_VISIBLE_DEVICES=0 trl vllm-serve --model "${your_model_path:?set your_model_path to the model to serve}"


# Launch GRPO training via Accelerate on GPUs 1-7 (GPU 0 is left to the
# vLLM server started above). --num_processes=7 matches the seven visible
# devices, i.e. one process per GPU. ACCELERATE_LOG_LEVEL=info is set for
# this command only.
# NOTE(review): zero3.yaml is presumably a DeepSpeed ZeRO stage 3 Accelerate
# config, judging by its name; recipes/recipe_path.yaml looks like a
# placeholder for the actual recipe file — confirm both.
CUDA_VISIBLE_DEVICES=1,2,3,4,5,6,7 \
ACCELERATE_LOG_LEVEL=info \
  accelerate launch \
    --config_file recipes/accelerate_configs/zero3.yaml \
    --num_processes=7 \
    src/grpo.py \
    --config recipes/recipe_path.yaml