2025-05-24 07:16:26 +08:00
regex # Replaces the standard-library re module for higher-performance regex matching
2025-03-15 17:52:05 +08:00
cachetools
2023-05-07 16:30:43 -07:00
psutil
sentencepiece # Required for LLaMA tokenizer.
2025-03-29 12:11:51 +08:00
numpy
2024-09-27 23:45:50 -07:00
requests >= 2.26.0
2024-06-19 22:37:33 +08:00
tqdm
2024-12-11 19:55:30 -05:00
blake3
2024-03-28 22:16:12 -07:00
py-cpuinfo
2025-04-08 14:53:39 +01:00
transformers >= 4.51.1
2025-05-26 22:10:56 +08:00
huggingface-hub[hf_xet] >= 0.32.0 # Required for Xet downloads.
2025-04-17 07:45:24 -07:00
tokenizers >= 0.21.1 # Required for fast incremental detokenization.
2024-08-16 01:03:01 +08:00
protobuf # Required by LlamaTokenizer.
2025-02-25 22:03:33 +08:00
fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint.
2024-05-15 19:13:36 -04:00
aiohttp
2024-12-19 02:17:05 +08:00
openai >= 1.52.0 # Ensures a modern openai package (types module present and max_completion_tokens field supported)
2025-05-29 06:05:46 -04:00
pydantic >= 2.10
2024-02-28 13:38:26 +08:00
prometheus_client >= 0.18.0
2024-12-18 03:34:08 -03:00
pillow # Required for image processing
2024-04-29 01:59:33 +03:00
prometheus-fastapi-instrumentator >= 7.0.0
2024-05-17 14:58:52 -04:00
tiktoken >= 0.6.0 # Required for DBRX tokenizer
2025-02-27 19:16:12 +02:00
lm-format-enforcer >= 0.10.11, < 0.11
2025-05-09 11:14:18 +08:00
llguidance >= 0.7.11, < 0.8.0; platform_machine == "x86_64" or platform_machine == "arm64" or platform_machine == "aarch64"
2025-01-21 14:49:08 +01:00
outlines == 0.1.11
2025-02-22 05:17:44 -08:00
lark == 1.2.2
2025-05-13 14:01:31 +08:00
xgrammar == 0.1.19; platform_machine == "x86_64" or platform_machine == "aarch64"
2024-08-09 10:39:41 +08:00
typing_extensions >= 4.10
2024-11-27 19:54:58 -08:00
filelock >= 3.16.1 # must include the change from https://github.com/tox-dev/filelock/pull/317
2024-09-04 15:18:13 -05:00
partial-json-parser # used for parsing partial JSON outputs
2025-04-14 22:06:03 -05:00
pyzmq >= 25.0.0
2024-08-18 17:57:20 -07:00
msgspec
2025-04-08 13:38:13 +08:00
gguf >= 0.13.0
2025-05-07 16:51:06 +02:00
importlib_metadata; python_version < '3.10'
2025-03-17 14:47:50 +01:00
mistral_common[opencv] >= 1.5.4
2025-04-01 23:55:13 +08:00
opencv-python-headless >= 4.11.0 # required for video IO
2024-09-01 14:46:57 -07:00
pyyaml
2024-09-07 14:03:16 -06:00
six>=1.16.0; python_version > '3.11' # transitive dependency of pandas; must be at least 1.16.0 to work on python 3.12
2025-05-01 02:25:36 -04:00
setuptools>=77.0.3,<80; python_version > '3.11' # Setuptools is used by triton; on 3.12+ a modern version must be installed so that it does not try to import distutils, which was removed in 3.12
2024-09-12 00:31:19 +08:00
einops # Required for Qwen2-VL.
2025-06-09 17:33:15 -04:00
compressed-tensors == 0.10.1 # required for compressed-tensors
2024-12-19 18:13:06 -08:00
depyf==0.18.0 # required for profiling and debugging with compilation config
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
2025-02-22 05:17:44 -08:00
watchfiles # required for http server to monitor the updates of TLS files
2025-05-26 22:38:04 +08:00
python-json-logger # Used by logging as per examples/others/logging_configuration.md
2025-03-11 11:03:44 -04:00
scipy # Required for phi-4-multimodal-instruct
2025-03-14 17:25:28 -04:00
ninja # Required for xgrammar, rocm, tpu, xpu
2025-05-08 07:32:49 +02:00
opentelemetry-sdk>=1.26.0 # vllm.tracing
opentelemetry-api>=1.26.0 # vllm.tracing
opentelemetry-exporter-otlp>=1.26.0 # vllm.tracing
opentelemetry-semantic-conventions-ai>=0.4.1 # vllm.tracing