cuda.txt 699 Bytes
Newer Older
1
# Common dependencies
2
-r common.txt
3

4
numba == 0.61.2 # Required for N-gram speculative decoding
5

6
# Dependencies for NVIDIA GPUs
Rui Qiao's avatar
Rui Qiao committed
7
ray[cgraph]>=2.48.0 # Ray Compiled Graph, required for pipeline parallelism in V1.
Huy Do's avatar
Huy Do committed
8
9
torch==2.8.0
torchaudio==2.8.0
10
# The pins below (torchvision, xformers) must be updated alongside torch
Huy Do's avatar
Huy Do committed
11
12
13
torchvision==0.23.0 # Required for phi3v processor. See https://github.com/pytorch/vision?tab=readme-ov-file#installation for the torchvision version corresponding to the pinned torch version
# https://github.com/facebookresearch/xformers/releases/tag/v0.0.32.post1
xformers==0.0.32.post1; platform_system == 'Linux' and platform_machine == 'x86_64'  # Requires PyTorch >= 2.8
14
15
# The FlashInfer version pinned here should be updated together with the one in the Dockerfile
flashinfer-python==0.4.0