requirements.txt 441 Bytes
Newer Older
1
2
ninja  # For faster builds.
psutil
3
ray >= 2.9
4
5
sentencepiece  # Required for LLaMA tokenizer.
numpy
6
torch == 2.1.2
7
transformers >= 4.38.0  # Version 4.38.0 or newer is required for Gemma support.
8
xformers == 0.0.23.post1  # This pinned version is required for CUDA 12.1.
9
fastapi
10
uvicorn[standard]
11
pydantic >= 2.0  # Required for OpenAI server.
12
prometheus_client
13
pynvml == 11.5.0
whyiug's avatar
whyiug committed
14
triton >= 2.1.0
15
cupy-cuda12x == 12.1.0  # Required for CUDA graphs. CUDA 11.8 users should install cupy-cuda11x instead.