Dockerfile.cpu 6.76 KB
Newer Older
1
2
3
4
5
6
7
8
# This vLLM Dockerfile is used to build images that can run vLLM on both x86_64 and arm64 CPU platforms.
#
# Supported platforms:
#   - linux/amd64 (x86_64)
#   - linux/arm64 (aarch64)
#
# Use the `--platform` option with `docker buildx build` to specify the target architecture, e.g.:
#   docker buildx build --platform=linux/arm64 -f docker/Dockerfile.cpu .
9
10
11
12
13
14
15
#
# Build targets:
#   vllm-openai (default): used for serving deployment
#   vllm-test: used for CI tests
#   vllm-dev: used for development
#
# Build arguments:
#   PYTHON_VERSION=3.13|3.12 (default)|3.11|3.10
#   VLLM_CPU_DISABLE_AVX512=false (default)|true
#   VLLM_CPU_AVX512BF16=false (default)|true
#   VLLM_CPU_AVX512VNNI=false (default)|true
#

22
23
######################### COMMON BASE IMAGE #########################
FROM ubuntu:22.04 AS base-common

WORKDIR /workspace/

# PYTHON_VERSION selects the interpreter for the virtual environment created
# below; PIP_EXTRA_INDEX_URL is the additional package index exported to
# pip and uv further down.
ARG PYTHON_VERSION=3.12
ARG PIP_EXTRA_INDEX_URL="https://download.pytorch.org/whl/cpu"

# Install minimal dependencies and uv.
# The uv installer is written to a file and then executed instead of being
# piped straight into `sh`: under the default /bin/sh (no pipefail) a failed
# download would be masked by the exit status of `sh`, and the build would
# only break later when `uv` is first invoked.
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
    --mount=type=cache,target=/var/lib/apt,sharing=locked \
    apt-get update -y \
    && apt-get install -y --no-install-recommends sudo ccache git curl wget ca-certificates \
        gcc-12 g++-12 libtcmalloc-minimal4 libnuma-dev ffmpeg libsm6 libxext6 libgl1 jq lsof \
    && update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-12 10 --slave /usr/bin/g++ g++ /usr/bin/g++-12 \
    && curl -LsSf https://astral.sh/uv/install.sh -o /tmp/uv-install.sh \
    && sh /tmp/uv-install.sh \
    && rm -f /tmp/uv-install.sh

# Route C++ compilation through ccache; the cache directory matches the
# ccache cache mounts used by later build stages.
ENV CCACHE_DIR=/root/.cache/ccache
ENV CMAKE_CXX_COMPILER_LAUNCHER=ccache

# /root/.local/bin is put on PATH so the `uv` command installed above resolves
# (presumably the installer's default location -- confirm if the installer changes).
ENV PATH="/root/.local/bin:$PATH"
ENV VIRTUAL_ENV="/opt/venv"
ENV UV_PYTHON_INSTALL_DIR=/opt/uv/python
# Create the virtual environment and put its bin directory first on PATH so
# that `python3` and installed console scripts come from it.
RUN uv venv --python ${PYTHON_VERSION} --seed ${VIRTUAL_ENV}
ENV PATH="$VIRTUAL_ENV/bin:$PATH"

ENV UV_HTTP_TIMEOUT=500

# Install Python dependencies
ENV PIP_EXTRA_INDEX_URL=${PIP_EXTRA_INDEX_URL}
ENV UV_EXTRA_INDEX_URL=${PIP_EXTRA_INDEX_URL}
ENV UV_INDEX_STRATEGY="unsafe-best-match"
ENV UV_LINK_MODE="copy"
# Both requirement files are bind-mounted rather than copied, so they do not
# end up in an image layer (common.txt is presumably pulled in by cpu.txt).
RUN --mount=type=cache,target=/root/.cache/uv \
    --mount=type=bind,src=requirements/common.txt,target=requirements/common.txt \
    --mount=type=bind,src=requirements/cpu.txt,target=requirements/cpu.txt \
    uv pip install --upgrade pip && \
    uv pip install -r requirements/cpu.txt

# Re-declare the automatic platform argument inside the stage and persist it
# as an environment variable.
ARG TARGETARCH
ENV TARGETARCH=${TARGETARCH}

64
65
66
67
######################### x86_64 BASE IMAGE #########################
FROM base-common AS base-amd64

# x86_64: preload the tcmalloc allocator and the libiomp5 OpenMP runtime
# shipped inside the virtual environment.
ENV LD_PRELOAD=/usr/lib/x86_64-linux-gnu/libtcmalloc_minimal.so.4:/opt/venv/lib/libiomp5.so
68

69
70
######################### arm64 BASE IMAGE #########################
FROM base-common AS base-arm64

# aarch64: only the tcmalloc allocator is preloaded on this architecture.
ENV LD_PRELOAD=/usr/lib/aarch64-linux-gnu/libtcmalloc_minimal.so.4

######################### BASE IMAGE #########################
# Resolves to base-amd64 or base-arm64 depending on the target platform.
FROM base-${TARGETARCH} AS base

# Interactive bash sessions set the core-file size limit to zero.
RUN printf '%s\n' 'ulimit -c 0' >> ~/.bashrc
78

79
80
######################### BUILD IMAGE #########################
FROM base AS vllm-build

# Build parallelism, exported as MAX_JOBS.
ARG max_jobs=32
ENV MAX_JOBS=${max_jobs}

# Any value other than 0 runs tools/check_repo.sh after the sources are copied.
ARG GIT_REPO_CHECK=0

# CPU ISA switches, each overridable with --build-arg and exported to the
# build environment:
#   VLLM_CPU_DISABLE_AVX512="true"  build without AVX512
#   VLLM_CPU_AVX512BF16="true"      build with the AVX512BF16 ISA
#   VLLM_CPU_AVX512VNNI="true"      build with the AVX512VNNI ISA
ARG VLLM_CPU_DISABLE_AVX512=0
ARG VLLM_CPU_AVX512BF16=0
ARG VLLM_CPU_AVX512VNNI=0
ENV VLLM_CPU_DISABLE_AVX512=${VLLM_CPU_DISABLE_AVX512} \
    VLLM_CPU_AVX512BF16=${VLLM_CPU_AVX512BF16} \
    VLLM_CPU_AVX512VNNI=${VLLM_CPU_AVX512VNNI}

WORKDIR /workspace/vllm

# Build-time Python requirements; cpu-build.txt is bind-mounted under the
# name requirements/build.txt for the duration of this step only.
RUN --mount=type=bind,src=requirements/cpu-build.txt,target=requirements/build.txt \
    --mount=type=cache,target=/root/.cache/uv \
    uv pip install -r requirements/build.txt

COPY . .

# Optional repository check, skipped when GIT_REPO_CHECK is 0.
RUN --mount=type=bind,source=.git,target=.git \
    [ "$GIT_REPO_CHECK" = 0 ] || bash tools/check_repo.sh

# Build the CPU wheel into dist/. The uv, ccache and .deps directories are
# cache mounts, and .git is bind-mounted for this step.
RUN --mount=type=bind,source=.git,target=.git \
    --mount=type=cache,target=/root/.cache/uv \
    --mount=type=cache,target=/root/.cache/ccache \
    --mount=type=cache,target=/workspace/vllm/.deps,sharing=locked \
    VLLM_TARGET_DEVICE=cpu python3 setup.py bdist_wheel --dist-dir=dist --py-limited-api=cp38
111

112
113
114
115
116
######################### TEST DEPS #########################
FROM base AS vllm-test-deps

WORKDIR /workspace/vllm

# Derive the CPU test requirements from requirements/test.in:
#   - drop every line mentioning mamba_ssm
#   - pin torch to 2.8.0
#   - strip version constraints from torchaudio and torchvision
# then compile the result into requirements/cpu-test.txt.
# TODO: Update to 2.9.0 when there is a new build for intel_extension_for_pytorch for that version
RUN --mount=type=bind,src=requirements/test.in,target=requirements/test.in \
    cp requirements/test.in requirements/cpu-test.in \
    && sed -i \
        -e '/mamba_ssm/d' \
        -e 's/^torch==.*/torch==2.8.0/g' \
        -e 's/torchaudio.*/torchaudio/g' \
        -e 's/torchvision.*/torchvision/g' \
        requirements/cpu-test.in \
    && uv pip compile requirements/cpu-test.in -o requirements/cpu-test.txt --index-strategy unsafe-best-match --torch-backend cpu

# Install the compiled test requirements.
RUN --mount=type=cache,target=/root/.cache/uv \
    uv pip install -r requirements/cpu-test.txt
128

129
130
131
132
133
134
135
######################### DEV IMAGE #########################
FROM vllm-build AS vllm-dev

WORKDIR /workspace/vllm

# Extra tools for development.
# `apt-get update` runs in the same step as the install: the package lists
# live in the /var/lib/apt cache mount, which can be empty or pruned even
# when the earlier stage that populated it is served from the layer cache,
# and `apt-get install` then fails to locate the packages.
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
    --mount=type=cache,target=/var/lib/apt,sharing=locked \
    apt-get update -y \
    && apt-get install -y --no-install-recommends vim numactl xz-utils

# install development dependencies (for testing)
RUN --mount=type=cache,target=/root/.cache/uv \
    uv pip install -e tests/vllm_test_utils

# Install vLLM itself in development mode from the sources copied by the
# vllm-build stage.
RUN --mount=type=cache,target=/root/.cache/uv \
    --mount=type=cache,target=/root/.cache/ccache \
    --mount=type=bind,source=.git,target=.git \
    VLLM_TARGET_DEVICE=cpu python3 setup.py develop

# Replace requirements/test.txt with the CPU-specific test requirements
# compiled in the vllm-test-deps stage.
COPY --from=vllm-test-deps /workspace/vllm/requirements/cpu-test.txt requirements/test.txt

# Install the dev requirements and register the pre-commit and commit-msg hooks.
RUN --mount=type=cache,target=/root/.cache/uv \
    uv pip install -r requirements/dev.txt && \
    pre-commit install --hook-type pre-commit --hook-type commit-msg

ENTRYPOINT ["bash"]

######################### TEST IMAGE #########################
156
FROM vllm-test-deps AS vllm-test

WORKDIR /workspace/

# Install the wheel produced by the vllm-build stage; dist/ is bind-mounted
# from that stage so the wheel file itself is not stored in this image.
RUN --mount=type=cache,target=/root/.cache/uv \
    --mount=type=bind,from=vllm-build,src=/workspace/vllm/dist,target=dist \
    uv pip install dist/*.whl

# Plain local files and directories: COPY is used instead of ADD because none
# of ADD's extra behaviors (archive extraction, remote URLs) are wanted here.
COPY ./tests/ ./tests/
COPY ./examples/ ./examples/
COPY ./benchmarks/ ./benchmarks/
COPY ./vllm/collect_env.py .
COPY ./.buildkite/ ./.buildkite/

# Create symlink for vllm-workspace to maintain CI compatibility
RUN ln -sf /workspace /vllm-workspace

# install development dependencies (for testing)
RUN --mount=type=cache,target=/root/.cache/uv \
    uv pip install -e tests/vllm_test_utils
176
177
178
179
180
181
182
183
184
185

######################### RELEASE IMAGE #########################
FROM base AS vllm-openai

WORKDIR /workspace/

# Install the wheel built in the vllm-build stage. dist/ is bind-mounted from
# that stage, so only the installed package ends up in this image.
RUN --mount=type=bind,from=vllm-build,src=/workspace/vllm/dist,target=dist \
    --mount=type=cache,target=/root/.cache/uv \
    --mount=type=cache,target=/root/.cache/ccache \
    uv pip install dist/*.whl

# Arguments passed to `docker run <image> ...` are appended to `vllm serve`.
ENTRYPOINT ["vllm", "serve"]