2025-03-15 17:52:05 +08:00
cachetools
2023-05-07 16:30:43 -07:00
psutil
sentencepiece # Required for LLaMA tokenizer.
2025-03-29 12:11:51 +08:00
numpy
2024-09-27 23:45:50 -07:00
requests >= 2.26.0
2024-06-19 22:37:33 +08:00
tqdm
2024-12-11 19:55:30 -05:00
blake3
2024-03-28 22:16:12 -07:00
py-cpuinfo
2025-04-08 14:53:39 +01:00
transformers >= 4.51.1
2025-04-03 00:37:30 +01:00
huggingface-hub[hf_xet] >= 0.30.0 # Required for Xet downloads.
2025-04-17 07:45:24 -07:00
tokenizers >= 0.21.1 # Required for fast incremental detokenization.
2024-08-16 01:03:01 +08:00
protobuf # Required by LlamaTokenizer.
2025-02-25 22:03:33 +08:00
fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint.
2024-05-15 19:13:36 -04:00
aiohttp
2024-12-19 02:17:05 +08:00
openai >= 1.52.0 # Ensure a modern openai package (types module present and max_completion_tokens field supported)
2025-02-13 16:23:45 +01:00
pydantic >= 2.9
2024-02-28 13:38:26 +08:00
prometheus_client >= 0.18.0
2024-12-18 03:34:08 -03:00
pillow # Required for image processing
2024-04-29 01:59:33 +03:00
prometheus-fastapi-instrumentator >= 7.0.0
2024-05-17 14:58:52 -04:00
tiktoken >= 0.6.0 # Required for DBRX tokenizer
2025-02-27 19:16:12 +02:00
lm-format-enforcer >= 0.10.11, < 0.11
2025-03-25 00:02:33 -04:00
llguidance >= 0.7.9, < 0.8.0; platform_machine == "x86_64" or platform_machine == "arm64" or platform_machine == "aarch64"
2025-01-21 14:49:08 +01:00
outlines == 0.1.11
2025-02-22 05:17:44 -08:00
lark == 1.2.2
2025-04-08 22:13:22 -04:00
xgrammar == 0.1.18; platform_machine == "x86_64" or platform_machine == "aarch64"
2024-08-09 10:39:41 +08:00
typing_extensions >= 4.10
2024-11-27 19:54:58 -08:00
filelock >= 3.16.1 # Must include the change from https://github.com/tox-dev/filelock/pull/317
2024-09-04 15:18:13 -05:00
partial-json-parser # used for parsing partial JSON outputs
2025-04-14 22:06:03 -05:00
pyzmq >= 25.0.0
2024-08-18 17:57:20 -07:00
msgspec
2025-04-08 13:38:13 +08:00
gguf >= 0.13.0
2024-08-13 16:24:17 -07:00
importlib_metadata
2025-03-17 14:47:50 +01:00
mistral_common[opencv] >= 1.5.4
2025-04-01 23:55:13 +08:00
opencv-python-headless >= 4.11.0 # required for video IO
2024-09-01 14:46:57 -07:00
pyyaml
2024-09-07 14:03:16 -06:00
six>=1.16.0; python_version > '3.11' # Transitive dependency of pandas; needs to be at least 1.16.0 on Python 3.12+
2024-09-16 18:01:45 -06:00
setuptools>=74.1.1; python_version > '3.11' # Setuptools is used by triton. A modern version is needed on Python 3.12+ so that it does not try to import distutils, which was removed in 3.12
2024-09-12 00:31:19 +08:00
einops # Required for Qwen2-VL.
2025-04-08 03:09:06 +01:00
compressed-tensors == 0.9.3 # required for compressed-tensors
2024-12-19 18:13:06 -08:00
depyf==0.18.0 # required for profiling and debugging with compilation config
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
2025-02-22 05:17:44 -08:00
watchfiles # required for http server to monitor the updates of TLS files
2025-02-24 15:10:33 +01:00
python-json-logger # Used by logging as per examples/other/logging_configuration.md
2025-03-11 11:03:44 -04:00
scipy # Required for phi-4-multimodal-instruct
2025-03-14 17:25:28 -04:00
ninja # Required for xgrammar, rocm, tpu, xpu
2025-04-09 15:14:06 -04:00
opentelemetry-sdk>=1.26.0,<1.27.0 # vllm.tracing
opentelemetry-api>=1.26.0,<1.27.0 # vllm.tracing
opentelemetry-exporter-otlp>=1.26.0,<1.27.0 # vllm.tracing
opentelemetry-semantic-conventions-ai>=0.4.1,<0.5.0 # vllm.tracing