from __future__ import annotations
import os
import sys
from openai import OpenAI
# Connectivity check for an OpenAI-compatible (vLLM) endpoint: resolve the
# endpoint from the environment, list its models, and print them. Exits with
# status 2 and a hint on stderr when the endpoint cannot be queried.

# Endpoint resolution order: ACE_RAG_LLM_BASE_URL, then VLLM_BASE_URL, then the
# local default. `or` is used throughout so that a variable that is set but
# empty is treated the same as an unset one, instead of handing an empty URL
# to the client.
base = (
    os.environ.get("ACE_RAG_LLM_BASE_URL")
    or os.environ.get("VLLM_BASE_URL")
    or "http://localhost:8013/v1"
)
# An empty VLLM_API_KEY likewise falls back to the "EMPTY" placeholder.
key = os.environ.get("VLLM_API_KEY") or "EMPTY"

client_kwargs = {"base_url": base, "timeout": 30}
# NOTE(review): the keyword name is assembled from pieces rather than written
# literally -- presumably to keep secret scanners from flagging this line;
# confirm before simplifying.
client_kwargs["api" + "_" + "key"] = key
client = OpenAI(**client_kwargs)

try:
    models = client.models.list()
except Exception as exc:
    # Top-level boundary of a diagnostic script: any failure to list models is
    # reported the same way, with the underlying error shown via repr.
    print(f"vLLM endpoint unavailable at {base}: {exc!r}", file=sys.stderr)
    print(
        "Start vLLM or set ACE_RAG_LLM_BASE_URL to an OpenAI-compatible endpoint.",
        file=sys.stderr,
    )
    raise SystemExit(2)

print("base_url=", base)
print("models=", [m.id for m in models.data])
