2023-05-07 16:30:43 -07:00
psutil
sentencepiece # Required for LLaMA tokenizer.
2024-06-16 16:07:01 -07:00
numpy < 2.0.0
2024-09-27 23:45:50 -07:00
requests >= 2.26.0
2024-06-19 22:37:33 +08:00
tqdm
2024-12-11 19:55:30 -05:00
blake3
2024-03-28 22:16:12 -07:00
py-cpuinfo
2024-10-16 13:56:17 +08:00
transformers >= 4.45.2 # Required for Llama 3.2 and Qwen2-VL.
2024-04-18 14:36:39 -07:00
tokenizers >= 0.19.1 # Required for Llama 3.
2024-08-16 01:03:01 +08:00
protobuf # Required by LlamaTokenizer.
2024-09-27 07:54:09 +08:00
fastapi >= 0.107.0, < 0.113.0; python_version < '3.9'
fastapi >= 0.107.0, != 0.113.*, != 0.114.0; python_version >= '3.9'
2024-05-15 19:13:36 -04:00
aiohttp
2024-10-31 02:15:56 +01:00
openai >= 1.45.0 # Requires a modern openai package (types module present and max_completion_tokens field supported)
2023-09-27 21:41:36 -03:00
uvicorn[standard]
2024-09-13 11:21:42 +08:00
pydantic >= 2.9 # Required for fastapi >= 0.113.0
2024-06-03 13:56:41 +08:00
pillow # Required for image processing
2024-02-28 13:38:26 +08:00
prometheus_client >= 0.18.0
2024-04-29 01:59:33 +03:00
prometheus-fastapi-instrumentator >= 7.0.0
2024-05-17 14:58:52 -04:00
tiktoken >= 0.6.0 # Required for DBRX tokenizer
2024-11-15 15:50:40 +01:00
lm-format-enforcer >= 0.10.9, < 0.11
2024-12-14 02:46:18 -05:00
outlines == 0.1.11
2024-12-09 11:44:27 -05:00
xgrammar >= 0.1.6; platform_machine == "x86_64"
2024-08-09 10:39:41 +08:00
typing_extensions >= 4.10
2024-11-27 19:54:58 -08:00
filelock >= 3.16.1 # must include the change from https://github.com/tox-dev/filelock/pull/317
2024-09-04 15:18:13 -05:00
partial-json-parser # used for parsing partial JSON outputs
2024-07-09 18:49:11 -07:00
pyzmq
2024-08-18 17:57:20 -07:00
msgspec
2024-09-16 06:51:44 +08:00
gguf == 0.10.0
2024-08-13 16:24:17 -07:00
importlib_metadata
2024-11-15 09:48:07 -08:00
mistral_common[opencv] >= 1.5.0
2024-09-01 14:46:57 -07:00
pyyaml
2024-09-07 14:03:16 -06:00
six>=1.16.0; python_version > '3.11' # transitive dependency of pandas that needs to be the latest version for python 3.12
2024-09-16 18:01:45 -06:00
setuptools>=74.1.1; python_version > '3.11' # Setuptools is used by triton; a modern version is needed on Python 3.12+ so that it does not try to import distutils, which was removed in 3.12
2024-09-12 00:31:19 +08:00
einops # Required for Qwen2-VL.
2024-12-13 22:22:44 -05:00
compressed-tensors == 0.8.1 # required for loading models in the compressed-tensors format
2024-12-11 10:43:05 -08:00
depyf==0.18.0 # required for profiling and debugging torch.compile