"vllm/config/model.py" did not exist on "a5b84f1cbfeb4030fd7fab4a91d4264b356e20b0"
Dockerfile.hpu 405 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# Base image: Habana Gaudi PyTorch installer image (the Gaudi release, OS and
# PyTorch version are encoded in the image path).
# NOTE: the ":latest" tag is mutable, so a rebuild may silently pick up a
# different image. The default is kept for backward compatibility; for
# reproducible builds pin it at build time, e.g.
#   docker build --build-arg BASE_IMAGE=<image>:<fixed-tag or @sha256:digest> ...
ARG BASE_IMAGE=vault.habana.ai/gaudi-docker/1.18.0/ubuntu22.04/habanalabs/pytorch-installer-2.4.0:latest
FROM ${BASE_IMAGE}

# Copy the entire build context into the image and work from that directory.
COPY ./ /workspace/vllm

WORKDIR /workspace/vllm

# Install the HPU requirement set. --no-cache-dir stops pip from storing its
# download/wheel cache in this layer, where it would only inflate the image.
RUN pip install --no-cache-dir -v -r requirements-hpu.txt

# Environment baked into the image (visible to later build steps and at runtime):
#   no_proxy                       - loopback addresses are excluded from any
#                                    configured proxy.
#   PT_HPU_ENABLE_LAZY_COLLECTIVES - Habana PyTorch setting; presumably enables
#                                    lazy collective ops on HPU.
#                                    TODO confirm against the Gaudi docs.
ENV no_proxy=localhost,127.0.0.1 \
    PT_HPU_ENABLE_LAZY_COLLECTIVES=true

# Build and install the package from the current directory (/workspace/vllm).
# VLLM_TARGET_DEVICE=hpu is set only for this build command; it is not
# persisted into the image environment.
RUN export VLLM_TARGET_DEVICE=hpu \
    && python3 setup.py install

# Step out of the source tree so the container starts in /workspace/.
# NOTE(review): presumably this makes Python import the installed package
# rather than the source checkout; confirm.
WORKDIR /workspace/

# Start the vllm.entrypoints.openai.api_server module. Exec (JSON) form is used,
# so arguments passed to `docker run <image> ...` are appended to this command.
ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]