Dockerfile.rocm 7.43 KB
Newer Older
1
# Usage (to build SGLang ROCm docker image):
Yineng Zhang's avatar
Yineng Zhang committed
2
3
4
#   docker build --build-arg SGL_BRANCH=v0.5.3rc0 --build-arg GPU_ARCH=gfx942 -t v0.5.3rc0-rocm630-mi30x -f Dockerfile.rocm .
#   docker build --build-arg SGL_BRANCH=v0.5.3rc0 --build-arg GPU_ARCH=gfx942-rocm700 -t v0.5.3rc0-rocm700-mi30x -f Dockerfile.rocm .
#   docker build --build-arg SGL_BRANCH=v0.5.3rc0 --build-arg GPU_ARCH=gfx950 -t v0.5.3rc0-rocm700-mi35x -f Dockerfile.rocm .
sogalin's avatar
sogalin committed
5

6
7
8

# Default base images
ARG BASE_IMAGE_942="rocm/sgl-dev:vllm20250114"
9
10
ARG BASE_IMAGE_942_ROCM700="rocm/sgl-dev:rocm7-vllm-20250904"
ARG BASE_IMAGE_950="rocm/sgl-dev:rocm7-vllm-20250904"
11
12
13
14
15

# This is necessary for scope purpose
ARG GPU_ARCH=gfx950

# ===============================
sogalin's avatar
sogalin committed
16
# Base image 942 with rocm630 and args
17
18
19
FROM $BASE_IMAGE_942 AS gfx942
ENV BUILD_VLLM="0"
ENV BUILD_TRITON="1"
20
ENV BUILD_LLVM="0"
21
ENV BUILD_AITER_ALL="1"
22
ENV BUILD_MOONCAKE="1"
23
ENV AITER_COMMIT="v0.1.4"
24
ENV NO_DEPS_FLAG=""
25

sogalin's avatar
sogalin committed
26
27
28
29
30
31
32
33
34
35
36
# ===============================
# Base image 942 and args
FROM $BASE_IMAGE_942_ROCM700 AS gfx942-rocm700
ENV BUILD_VLLM="0"
ENV BUILD_TRITON="0"
ENV BUILD_LLVM="0"
ENV BUILD_AITER_ALL="1"
ENV BUILD_MOONCAKE="1"
ENV AITER_COMMIT="v0.1.5"
ENV NO_DEPS_FLAG=""

37
38
39
40
41
# ===============================
# Base image 950 and args
FROM $BASE_IMAGE_950 AS gfx950
ENV BUILD_VLLM="0"
ENV BUILD_TRITON="0"
sogalin's avatar
sogalin committed
42
ENV BUILD_LLVM="0"
43
ENV BUILD_AITER_ALL="1"
sogalin's avatar
sogalin committed
44
45
ENV BUILD_MOONCAKE="1"
ENV AITER_COMMIT="v0.1.5"
46
ENV NO_DEPS_FLAG="--no-deps"
47
48
49
50
51
52
53

# ===============================
# Chosen arch and args
FROM ${GPU_ARCH}

# This is necessary for scope purpose, again
ARG GPU_ARCH=gfx950
sogalin's avatar
sogalin committed
54
ENV GPU_ARCH_LIST=${GPU_ARCH%-*}
55
56
57
58
59
60
61

ARG SGL_REPO="https://github.com/sgl-project/sglang.git"
ARG SGL_DEFAULT="main"
ARG SGL_BRANCH=${SGL_DEFAULT}

ARG TRITON_REPO="https://github.com/ROCm/triton.git"
ARG TRITON_COMMIT="improve_fa_decode_3.0.0"
62

63
ARG AITER_REPO="https://github.com/ROCm/aiter.git"
64

65
66
67
68
ARG LLVM_REPO="https://github.com/jrbyrnes/llvm-project.git"
ARG LLVM_BRANCH="MainOpSelV2"
ARG LLVM_COMMIT="6520ace8227ffe2728148d5f3b9872a870b0a560"

69
ARG MOONCAKE_REPO="https://github.com/kvcache-ai/Mooncake.git"
sogalin's avatar
sogalin committed
70
ARG MOONCAKE_COMMIT="dcdf1c784b40aa6975a8ed89fe26321b028e40e8"
71

72
73
USER root

74
75
76
# Install some basic utilities
RUN python -m pip install --upgrade pip && pip install setuptools_scm
RUN apt-get purge -y sccache; python -m pip uninstall -y sccache; rm -f "$(which sccache)"
77

78
WORKDIR /sgl-workspace
79

80
81
82
# -----------------------
# llvm
RUN if [ "$BUILD_LLVM" = "1" ]; then \
sogalin's avatar
sogalin committed
83
     ENV HIP_CLANG_PATH="/sgl-workspace/llvm-project/build/bin/" \
84
85
86
87
88
89
90
91
92
93
94
     git clone --single-branch ${LLVM_REPO} -b ${LLVM_BRANCH} \
     && cd llvm-project \
     && git checkout ${LLVM_COMMIT} \
     && mkdir build \
     && cd build \
     && cmake -DCMAKE_BUILD_TYPE=Release -DLLVM_ENABLE_ASSERTIONS=1 -DLLVM_TARGETS_TO_BUILD="AMDGPU;X86" -DLLVM_ENABLE_PROJECTS="clang;lld;" -DLLVM_ENABLE_RUNTIMES="compiler-rt" ../llvm \
     && make -j$(nproc); \
    fi

# -----------------------

95
96
97
98
99
100
101
102
# -----------------------
# AITER
RUN pip uninstall -y aiter
RUN git clone ${AITER_REPO} \
 && cd aiter \
 && git checkout ${AITER_COMMIT} \
 && git submodule update --init --recursive
RUN cd aiter \
103
104
105
     && if [ "$BUILD_AITER_ALL" = "1" ] && [ "$BUILD_LLVM" = "1" ]; then \
          HIP_CLANG_PATH=/sgl-workspace/llvm-project/build/bin/ PREBUILD_KERNELS=1 GPU_ARCHS=$GPU_ARCH_LIST python setup.py develop; \
        elif [ "$BUILD_AITER_ALL" = "1" ]; then \
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
          PREBUILD_KERNELS=1 GPU_ARCHS=$GPU_ARCH_LIST python setup.py develop; \
        else \
          GPU_ARCHS=$GPU_ARCH_LIST python setup.py develop; \
        fi

# -----------------------
# Triton
RUN if [ "$BUILD_TRITON" = "1" ]; then \
        pip uninstall -y triton \
     && git clone ${TRITON_REPO} \
     && cd triton \
     && git checkout ${TRITON_COMMIT} \
     && cd python \
     && python setup.py install; \
    fi

# -----------------------
# Build vLLM
ARG VLLM_REPO="https://github.com/ROCm/vllm.git"
ARG VLLM_BRANCH="9f6b92db47c3444b7a7d67451ba0c3a2d6af4c2c"
RUN if [ "$BUILD_VLLM" = "1" ]; then \
        git clone ${VLLM_REPO} \
     && cd vllm \
     && git checkout ${VLLM_BRANCH} \
     && python -m pip install -r requirements/rocm.txt \
     && python setup.py clean --all \
     && python setup.py develop; \
    fi

135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
# -----------------------
# Build Mooncake
ENV PATH=$PATH:/usr/local/go/bin

RUN if [ "$BUILD_MOONCAKE" = "1" ]; then \
     apt update && apt install -y zip unzip wget && \
     apt install -y gcc make libtool autoconf  librdmacm-dev rdmacm-utils infiniband-diags ibverbs-utils perftest ethtool  libibverbs-dev rdma-core && \
     apt install -y openssh-server openmpi-bin openmpi-common libopenmpi-dev && \
     git clone ${MOONCAKE_REPO} && \
     cd Mooncake && \
     git checkout ${MOONCAKE_COMMIT} && \
     git submodule update --init --recursive && \
     bash dependencies.sh -y && \
     rm -rf /usr/local/go && \
     wget https://go.dev/dl/go1.22.2.linux-amd64.tar.gz && \
     tar -C /usr/local -xzf go1.22.2.linux-amd64.tar.gz && \
     rm go1.22.2.linux-amd64.tar.gz && \
     mkdir -p build && \
     cd build && \
     cmake .. -DUSE_ETCD=ON && \
     make -j "$(nproc)" && make install; \
    fi


159
160
161
# -----------------------
# Build SGLang
ARG BUILD_TYPE=all
162

163
164
165
RUN pip install IPython \
    && pip install orjson \
    && pip install python-multipart \
sogalin's avatar
sogalin committed
166
    && pip install torchao==0.9.0 \
167
    && pip install pybind11
168

169
RUN pip uninstall -y sgl_kernel sglang
170
171
172
173
RUN git clone ${SGL_REPO} \
    && cd sglang \
    && if [ "${SGL_BRANCH}" = ${SGL_DEFAULT} ]; then \
         echo "Using ${SGL_DEFAULT}, default branch."; \
174
         git checkout ${SGL_DEFAULT}; \
175
176
177
178
       else \
         echo "Using ${SGL_BRANCH} branch."; \
         git checkout ${SGL_BRANCH}; \
       fi \
179
    && cd sgl-kernel \
180
181
    && rm -f pyproject.toml \
    && mv pyproject_rocm.toml pyproject.toml \
182
    && AMDGPU_TARGET=$GPU_ARCH_LIST python setup_rocm.py install \
183
    && cd .. \
184
    && rm -rf python/pyproject.toml && mv python/pyproject_other.toml python/pyproject.toml \
185
    && if [ "$BUILD_TYPE" = "srt" ]; then \
186
         python -m pip --no-cache-dir install -e "python[srt_hip]" ${NO_DEPS_FLAG}; \
187
       else \
188
         python -m pip --no-cache-dir install -e "python[all_hip]" ${NO_DEPS_FLAG}; \
189
190
191
192
       fi

RUN python -m pip cache purge

193
194
195
196
197
# Copy config files to support MI300X in virtualized environments (MI300X_VF).  Symlinks will not be created in image build.
RUN find /sgl-workspace/sglang/python/sglang/srt/layers/quantization/configs/ \
         /sgl-workspace/sglang/python/sglang/srt/layers/moe/fused_moe_triton/configs/ \
         -type f -name '*MI300X*' | xargs -I {} sh -c 'vf_config=$(echo "$1" | sed "s/MI300X/MI300X_VF/"); cp "$1" "$vf_config"' -- {}

198
199
200
201
202
203
204
205
206
207
208
209
# Install Rust toolchain for sgl-router
ENV PATH="/root/.cargo/bin:${PATH}"
RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y \
    && rustc --version && cargo --version

# Build and install sgl-router
RUN python3 -m pip install --no-cache-dir setuptools-rust \
    && cd /sgl-workspace/sglang/sgl-router \
    && cargo build --release \
    && python3 -m pip install --no-cache-dir . \
    && rm -rf /root/.cache

210
211
# Performance environment variable.
ENV HIP_FORCE_DEV_KERNARG=1
HAI's avatar
HAI committed
212
ENV HSA_NO_SCRATCH_RECLAIM=1
213
ENV SGLANG_SET_CPU_AFFINITY=1
214
215
216
ENV SGLANG_ALLOW_OVERWRITE_LONGER_CONTEXT_LEN=1
ENV NCCL_MIN_NCHANNELS=112

217
ENV SGLANG_USE_AITER=1
HAI's avatar
HAI committed
218
ENV SGLANG_MOE_PADDING=1
219
220
221
222
ENV VLLM_FP8_PADDING=1
ENV VLLM_FP8_ACT_PADDING=1
ENV VLLM_FP8_WEIGHT_PADDING=1
ENV VLLM_FP8_REDUCE_CONV=1
223
224
ENV TORCHINDUCTOR_MAX_AUTOTUNE=1
ENV TORCHINDUCTOR_MAX_AUTOTUNE_POINTWISE=1
225
226

CMD ["/bin/bash"]