common.txt 2.45 KB
Newer Older
1
regex # Used in place of the stdlib re module for higher-performance regex matching
2
cachetools
3
4
psutil
sentencepiece  # Required for LLaMA tokenizer.
zhuwenwen's avatar
zhuwenwen committed
5
numpy == 1.25
6
requests >= 2.26.0
7
tqdm
8
blake3
yhu422's avatar
yhu422 committed
9
py-cpuinfo
10
transformers >= 4.55.2
11
tokenizers >= 0.21.1  # Required for fast incremental detokenization.
12
protobuf # Required by LlamaTokenizer.
13
fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint.
14
aiohttp
15
openai >= 1.99.1  # For Responses API with reasoning content
16
pydantic >= 2.11.7
17
prometheus_client >= 0.18.0
18
pillow  # Required for image processing
19
prometheus-fastapi-instrumentator >= 7.0.0
20
tiktoken >= 0.6.0  # Required for DBRX tokenizer
21
lm-format-enforcer == 0.11.3
22
llguidance >= 0.7.11, < 0.8.0; platform_machine == "x86_64" or platform_machine == "arm64" or platform_machine == "aarch64"
23
outlines_core == 0.2.11
24
25
# required for outlines backend disk cache
diskcache == 5.6.3
26
lark == 1.2.2
27
xgrammar == 0.1.23; platform_machine == "x86_64" or platform_machine == "aarch64" or platform_machine == "arm64"
28
typing_extensions >= 4.10
29
filelock >= 3.16.1 # needs to include https://github.com/tox-dev/filelock/pull/317
30
partial-json-parser # used for parsing partial JSON outputs
31
pyzmq >= 25.0.0
32
msgspec
33
gguf >= 0.13.0
34
importlib_metadata; python_version < '3.10'
zhuwenwen's avatar
zhuwenwen committed
35
mistral_common[image,audio] >= 1.5.4 # requires numpy>=1.25; NOTE(review): the trailing "1.8.2" presumably records a previous/upstream minimum version - TODO confirm
36
opencv-python-headless >= 4.11.0    # required for video IO
37
pyyaml
38
six>=1.16.0; python_version > '3.11' # transitive dependency of pandas that needs to be the latest version for python 3.12
39
setuptools>=77.0.3,<80; python_version > '3.11' # Setuptools is used by triton; we need to ensure a modern version is installed for 3.12+ so that it does not try to import distutils, which was removed in 3.12
40
einops # Required for Qwen2-VL.
41
compressed-tensors == 0.11.0 # required for compressed-tensors
42
depyf==0.19.0 # required for profiling and debugging with compilation config
43
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
44
watchfiles # required for http server to monitor the updates of TLS files
45
python-json-logger # Used by logging as per examples/others/logging_configuration.md
46
scipy # Required for phi-4-multimodal-instruct
47
ninja # Required for xgrammar, rocm, tpu, xpu
48
pybase64 # fast base64 implementation
49
cbor2 # Required for cross-language serialization of hashable objects
50
setproctitle # Used to set process names for better debugging and monitoring
51
openai-harmony >= 0.0.3  # Required for gpt-oss