2023-05-07 16:30:43 -07:00
psutil
sentencepiece # Required for LLaMA tokenizer.
2024-06-16 16:07:01 -07:00
numpy < 2.0.0
2024-09-27 23:45:50 -07:00
requests >= 2.26.0
2024-06-19 22:37:33 +08:00
tqdm
2024-12-11 19:55:30 -05:00
blake3
2024-03-28 22:16:12 -07:00
py-cpuinfo
2025-02-03 14:30:38 +01:00
transformers >= 4.48.2 # Required for Bamba model and Transformers backend.
2024-04-18 14:36:39 -07:00
tokenizers >= 0.19.1 # Required for Llama 3.
2024-08-16 01:03:01 +08:00
protobuf # Required by LlamaTokenizer.
2025-02-25 22:03:33 +08:00
fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint.
2024-05-15 19:13:36 -04:00
aiohttp
2024-12-19 02:17:05 +08:00
openai >= 1.52.0 # Ensure a modern openai package (types module present and max_completion_tokens field supported).
2025-02-13 16:23:45 +01:00
pydantic >= 2.9
2024-02-28 13:38:26 +08:00
prometheus_client >= 0.18.0
2024-12-18 03:34:08 -03:00
pillow # Required for image processing
2024-04-29 01:59:33 +03:00
prometheus-fastapi-instrumentator >= 7.0.0
2024-05-17 14:58:52 -04:00
tiktoken >= 0.6.0 # Required for DBRX tokenizer
2025-02-27 19:16:12 +02:00
lm-format-enforcer >= 0.10.11, < 0.11
2025-01-21 14:49:08 +01:00
outlines == 0.1.11
2025-02-22 05:17:44 -08:00
lark == 1.2.2
2025-02-15 22:42:25 -05:00
xgrammar == 0.1.11; platform_machine == "x86_64"
2024-08-09 10:39:41 +08:00
typing_extensions >= 4.10
2024-11-27 19:54:58 -08:00
filelock >= 3.16.1 # Needs to include the change from https://github.com/tox-dev/filelock/pull/317
2024-09-04 15:18:13 -05:00
partial-json-parser # used for parsing partial JSON outputs
2024-07-09 18:49:11 -07:00
pyzmq
2024-08-18 17:57:20 -07:00
msgspec
2024-09-16 06:51:44 +08:00
gguf == 0.10.0
2024-08-13 16:24:17 -07:00
importlib_metadata
2024-11-15 09:48:07 -08:00
mistral_common[opencv] >= 1.5.0
2024-09-01 14:46:57 -07:00
pyyaml
2024-09-07 14:03:16 -06:00
six>=1.16.0; python_version > '3.11' # Transitive dependency of pandas; a recent version is needed on Python 3.12+.
2024-09-16 18:01:45 -06:00
setuptools>=74.1.1; python_version > '3.11' # Setuptools is used by triton; a modern version must be installed on Python 3.12+ so that setuptools does not try to import distutils, which was removed in 3.12.
2024-09-12 00:31:19 +08:00
einops # Required for Qwen2-VL.
2025-02-22 01:09:04 -05:00
compressed-tensors == 0.9.2 # required for compressed-tensors
2024-12-19 18:13:06 -08:00
depyf==0.18.0 # required for profiling and debugging with compilation config
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
2025-02-22 05:17:44 -08:00
watchfiles # required for http server to monitor the updates of TLS files
2025-02-24 15:10:33 +01:00
python-json-logger # Used by logging as per examples/other/logging_configuration.md
2025-03-04 20:57:01 -08:00
scipy # Required for phi-4-multimodal-instruct