"tests/kernels/quantization/untest_block_fp8.py" did not exist on "4d022cbc757e89b2296daf3b33303eeea4ba4a62"
Dockerfile.hpu 610 Bytes
Newer Older
1
# Base image: Habana Gaudi PyTorch installer image from vault.habana.ai
# (release path 1.19.1, Ubuntu 22.04, pytorch-installer-2.5.1).
# NOTE(review): the `:latest` tag is floating, so rebuilds may pick up a
# different image over time — consider pinning a specific tag or digest.
FROM vault.habana.ai/gaudi-docker/1.19.1/ubuntu22.04/habanalabs/pytorch-installer-2.5.1:latest
2
3
4
5
6
7
8
9
10
11
12
13

# Copy the entire build context into the image; it is used below as the
# vLLM source tree (requirements-hpu.txt and setup.py are read from it).
COPY ./ /workspace/vllm

WORKDIR /workspace/vllm

# Install the HPU requirements. --no-cache-dir keeps pip's download/wheel
# cache out of this layer so it does not inflate the final image.
RUN pip install --no-cache-dir -v -r requirements-hpu.txt

# These variables persist into the running container as well as the
# remaining build steps. no_proxy exempts loopback addresses from any proxy;
# PT_HPU_ENABLE_LAZY_COLLECTIVES is an HPU PyTorch setting (see Habana docs).
ENV no_proxy=localhost,127.0.0.1 \
    PT_HPU_ENABLE_LAZY_COLLECTIVES=true

# Build and install vLLM from the copied sources with the HPU target selected.
# VLLM_TARGET_DEVICE is set inline so it applies only to this command.
RUN VLLM_TARGET_DEVICE=hpu python3 setup.py install

youkaichao's avatar
youkaichao committed
14
15
16
# Install development dependencies (for testing): the vllm_test_utils package
# is installed in editable mode from the source tree. --no-cache-dir avoids
# leaving pip's cache in the image layer.
RUN python3 -m pip install --no-cache-dir -e tests/vllm_test_utils

17
18
# Make /workspace/ the working directory for the following instructions and
# for the container at runtime.
WORKDIR /workspace/

19
20
# Expose the tests, examples and benchmarks directories of the source tree
# as same-named symlinks in the current working directory.
RUN ln -s \
      /workspace/vllm/tests \
      /workspace/vllm/examples \
      /workspace/vllm/benchmarks \
      ./

21
# Start the vLLM OpenAI-compatible API server module by default. Exec (JSON)
# form runs python3 directly as the container's main process, and any
# arguments given to `docker run` are appended to this command.
ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]