# Python package requirements in pip requirements-file format, one per line.
# Entries with `>=` set a minimum version; entries without a specifier accept
# any version. None of the entries here set an upper bound or an exact pin.
ninja  # For faster builds.
typing-extensions>=4.8.0
starlette
psutil
ray >= 2.9
sentencepiece  # Required for LLaMA tokenizer.
numpy
tokenizers>=0.15.0
transformers >= 4.37.0  # Required for Mixtral.
fastapi
# `[standard]` requests uvicorn's optional "standard" extra.
uvicorn[standard]
pydantic >= 2.0  # Required for OpenAI server.
# `[starlette]` requests aioprometheus's optional "starlette" extra.
# NOTE(review): starlette is also listed directly above; presumably intentional — confirm.
aioprometheus[starlette]
