GPU=0
echo "Checking if the generator ${GENERATOR} is available..."

GENERATOR_PORT=${GENERATOR_URL: -5}
if [[ "$GENERATOR" == *"/"* ]]; then
    if [[ ! "$GENERATOR" == *"Qwen2.5-32B-Instruct"* ]]; then
        CUDA_VISIBLE_DEVICES=${GPU} python -m vllm.entrypoints.openai.api_server \
            --model ${GENERATOR} \
            --port ${GENERATOR_PORT} &> output.log &
        vllm_pid=$!
    fi

    while true; do
        response=$(curl -s -o /dev/null -w "%{http_code}" ${GENERATOR_URL}/v1/models)
        if [ $response -eq 200 ]; then
            break
        fi
        sleep 2
    done
else
    case $GENERATOR in
        "gpt-4o-mini"|"gpt-4o"|"gpt-4o-2024-08-06") 
            hub_url="$HUB_URL/chat/completions"
            hub_key=$HUB_KEY
            ;;
        "deepseek-r1"|"deepseek-v3")
            hub_url="$HUB_URL/chat/completions"
            hub_key=$HUB_KEY
            ;;
        *)
            echo "Unsupported generator model: ${GENERATOR}"
            exit 1
            ;;

    esac   
    test_payload=$(cat <<EOF
{
  "model": "$GENERATOR",
  "messages": [
    {"role": "user", "content": "output PING SUCCESS! directly"}
  ]
}
EOF
)
    full_response=$(curl -si \
        -H "Authorization: Bearer $hub_key" \
        -H "Content-Type: application/json" \
        -H "User-Agent: Apifox/1.0.0 (https://apifox.com)" \
        -d "$test_payload" \
        $hub_url)

    http_code=$(echo "$full_response" | grep -E '^HTTP/' | awk '{print $2}')
    response_content=$(echo "$full_response" | awk '/^\r$/{seen=1;next} seen' | jq -r '.choices[0].message.content')

    echo "$response_content"
    if [ "$http_code" -ne 200 ]; then
        echo "${GENERATOR} API is unavailable (HTTP $response). Check key or network."
        exit 1
    fi
            
fi

echo "Generator ${GENERATOR} is available."