#!/bin/bash
# set -e

# Values of the supported command-line options. Both stay empty when the
# corresponding option is not given. Nothing else in the visible part of this
# script reads them.
MASTER_ADDR=""
PORT=""

#######################################
# Parse command-line options into globals.
# Globals:   MASTER_ADDR (written), PORT (written)
# Arguments: the script's arguments. Recognised options:
#              --master_addr VALUE
#              --port VALUE
#            Any other argument is silently skipped.
# Outputs:   an error message on stderr when an option lacks its value.
# Returns:   0 on success, 2 when an option is missing its value.
#######################################
parse_args() {
    while [[ $# -gt 0 ]]; do
        case "$1" in
            --master_addr)
                # `shift 2` with only one argument left fails WITHOUT
                # shifting, which would make this loop spin forever.
                if [[ $# -lt 2 ]]; then
                    printf 'Error: option %s requires a value\n' "$1" >&2
                    return 2
                fi
                MASTER_ADDR=$2
                shift 2
                ;;
            --port)
                if [[ $# -lt 2 ]]; then
                    printf 'Error: option %s requires a value\n' "$1" >&2
                    return 2
                fi
                PORT=$2
                shift 2
                ;;
            *)
                # Unknown arguments are ignored rather than rejected.
                shift
                ;;
        esac
    done
    return 0
}

parse_args "$@" || exit 2

echo "[Node0] Starting vLLM server on host=0.0.0.0"

# ports[i] is paired with gpus[i]; one server process is started per pair.
ports=(5000 5001 5002 5003 5004 5005 5006 5007)
gpus=(0 1 2 3 4 5 6 7)

# Each server's output is redirected into this directory. If it is missing
# the redirection fails and the server command is never executed, so create
# it before launching anything.
log_dir="logs"
if ! mkdir -p -- "$log_dir"; then
    printf 'Error: cannot create log directory %s\n' "$log_dir" >&2
    exit 1
fi

# Exported so that every server process started below inherits it.
export VLLM_DISABLE_COMPILE_CACHE=1
for i in "${!ports[@]}"; do
    port=${ports[$i]}
    gpu=${gpus[$i]}
    echo "Launching vLLM GPU=$gpu Port=$port"

    # Run in the background with only the selected GPU visible; stdout and
    # stderr both go to a per-port log file.
    CUDA_VISIBLE_DEVICES="$gpu" python vllm_service_init/start_vllm_server.py \
        --host 0.0.0.0 \
        --port "$port" \
        --model_path 'Qwen3-8B-Base_solver' \
        > "$log_dir/qwen8b_vllm_$port.log" 2>&1 &
done

# Printed as soon as the processes have been spawned; no readiness check is
# performed here.
echo "[Node0] vLLM server started. Node0 will idle."
# Block until every background server process has exited.
wait
