requirements.txt 325 Bytes
Newer Older
1
2
ninja  # For faster builds.
psutil
3
ray >= 2.9
4
5
sentencepiece  # Required for LLaMA tokenizer.
numpy
6
torch == 2.1.2
Junyang Lin's avatar
Junyang Lin committed
7
transformers >= 4.37.0  # Required for Qwen2.
8
xformers == 0.0.23.post1  # Required for CUDA 12.1.
9
fastapi
10
uvicorn[standard]
11
pydantic >= 2.0  # Required for OpenAI server.
12
aioprometheus[starlette]
13
pynvml == 11.5.0