common.txt 2.87 KB
Newer Older
1
regex # Replaces the standard-library `re` module for higher-performance regex matching
2
cachetools
3
4
psutil
sentencepiece  # Required for LLaMA tokenizer.
5
numpy
6
requests >= 2.26.0
7
tqdm
8
blake3
yhu422's avatar
yhu422 committed
9
py-cpuinfo
10
transformers >= 4.56.0, != 5.0.*, != 5.1.*, != 5.2.*, != 5.3.*, != 5.4.*, != 5.5.0
11
tokenizers >= 0.21.1  # Required for fast incremental detokenization.
12
protobuf >= 5.29.6, !=6.30.*, !=6.31.*, !=6.32.*, !=6.33.0.*, !=6.33.1.*, !=6.33.2.*, !=6.33.3.*, !=6.33.4.* # Required by LlamaTokenizer, gRPC. CVE-2026-0994
13
fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint.
Cyrus Leung's avatar
Cyrus Leung committed
14
aiohttp >= 3.13.3
15
openai >= 2.0.0  # For Responses API with reasoning content
16
pydantic >= 2.12.0
17
prometheus_client >= 0.18.0
18
pillow  # Required for image processing
19
prometheus-fastapi-instrumentator >= 7.0.0
20
tiktoken >= 0.6.0  # Required for DBRX tokenizer
21
lm-format-enforcer == 0.11.3
22
llguidance >= 1.3.0, < 1.4.0; platform_machine == "x86_64" or platform_machine == "arm64" or platform_machine == "aarch64" or platform_machine == "ppc64le"
23
outlines_core == 0.2.11
24
25
# required for outlines backend disk cache
diskcache == 5.6.3
26
lark == 1.2.2
27
xgrammar >= 0.1.32, < 1.0.0; platform_machine == "x86_64" or platform_machine == "aarch64" or platform_machine == "arm64" or platform_machine == "s390x" or platform_machine == "ppc64le"
28
typing_extensions >= 4.10
29
filelock >= 3.16.1 # needs to include https://github.com/tox-dev/filelock/pull/317
30
partial-json-parser # used for parsing partial JSON outputs
31
pyzmq >= 25.0.0
32
msgspec
33
gguf >= 0.17.0
34
mistral_common[image] >= 1.11.0
35
opencv-python-headless >= 4.13.0    # required for video IO
36
pyyaml
37
six>=1.16.0; python_version > '3.11' # transitive dependency of pandas; a recent version is needed on Python 3.12+
38
setuptools>=77.0.3,<81.0.0; python_version > '3.11' # setuptools is used by triton; a modern version must be installed on Python 3.12+ so that it does not try to import distutils, which was removed in 3.12
39
einops # Required for Qwen2-VL.
40
compressed-tensors == 0.15.0.1 # required for compressed-tensors
41
depyf==0.20.0 # required for profiling and debugging with compilation config
42
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
43
watchfiles # required for http server to monitor the updates of TLS files
44
python-json-logger # Used by logging as per examples/others/logging_configuration.md
45
ninja # Required for xgrammar, rocm, tpu, xpu
46
pybase64 # fast base64 implementation
47
cbor2 # Required for cross-language serialization of hashable objects
48
ijson # Required for mistral streaming tool parser
49
setproctitle # Used to set process names for better debugging and monitoring
50
openai-harmony >= 0.0.3  # Required for gpt-oss
51
anthropic >= 0.71.0
52
model-hosting-container-standards >= 0.1.13, < 1.0.0
53
mcp
54
55
56
57
opentelemetry-sdk >= 1.27.0
opentelemetry-api >= 1.27.0
opentelemetry-exporter-otlp >= 1.27.0
opentelemetry-semantic-conventions-ai >= 0.4.1