#!/usr/bin/env bash
# Runs run_vllm_server.py with a chosen set of GPUs, model path and port.
#
# Optional environment overrides (when unset or empty, the defaults below
# reproduce the previously hard-coded values exactly):
#   GPU_IDS      comma-separated device list exported as CUDA_VISIBLE_DEVICES
#                (default: 4,5,6,7)
#   MODEL_PATH   value passed to --model_path
#                (default: YOUR_PATH/Qwen2.5-7B-Instruct)
#   SERVER_PORT  value passed to --port (default: 8007)
#
# NOTE: the default MODEL_PATH still contains the placeholder "YOUR_PATH";
# either edit it here or set MODEL_PATH before running.
#
# Example:
#   GPU_IDS=0,1 MODEL_PATH=/models/Qwen2.5-7B-Instruct SERVER_PORT=8010 bash <this script>

# Always (re)export the device list so the Python process sees only these GPUs.
export CUDA_VISIBLE_DEVICES="${GPU_IDS:-4,5,6,7}"

# python -u: unbuffered stdout/stderr, so log lines show up immediately.
python -u run_vllm_server.py \
    --model_path "${MODEL_PATH:-YOUR_PATH/Qwen2.5-7B-Instruct}" \
    --port "${SERVER_PORT:-8007}"