Dockerfile.rocm 2.59 KB
Newer Older
1
# Usage (to build SGLang ROCm docker image):
2
#   docker build --build-arg SGL_BRANCH=v0.4.6.post1 -t v0.4.6.post1-rocm630 -f Dockerfile.rocm .
3
4

# default base image
5
ARG BASE_IMAGE="rocm/sgl-dev:vllm20250114"
6
7
8
9
10

FROM $BASE_IMAGE AS base
USER root

WORKDIR /sgl-workspace
11
ARG BUILD_TYPE=all
12
13
14
15
ARG SGL_REPO="https://github.com/sgl-project/sglang"
ENV SGL_DEFAULT="main"
ARG SGL_BRANCH=${SGL_DEFAULT}

HAI's avatar
HAI committed
16
17
ARG TRITON_REPO="https://github.com/ROCm/triton.git"
ARG TRITON_COMMIT="improve_fa_decode_3.0.0"
18

19

20
ARG AITER_REPO="https://github.com/ROCm/aiter.git"
HAI's avatar
HAI committed
21
ARG AITER_COMMIT="v0.1.1"
22

23
24
25
26
27
28
29
30
RUN git clone ${SGL_REPO} \
    && cd sglang \
    && if [ "${SGL_BRANCH}" = ${SGL_DEFAULT} ]; then \
         echo "Using ${SGL_DEFAULT}, default branch."; \
       else \
         echo "Using ${SGL_BRANCH} branch."; \
         git checkout ${SGL_BRANCH}; \
       fi \
31
    && cd sgl-kernel \
32
33
    && rm -f pyproject.toml \
    && mv pyproject_rocm.toml pyproject.toml \
34
35
    && python setup_rocm.py install \
    && cd .. \
36
37
38
39
40
41
42
43
44
    && if [ "$BUILD_TYPE" = "srt" ]; then \
         python -m pip --no-cache-dir install -e "python[srt_hip]"; \
       else \
         python -m pip --no-cache-dir install -e "python[all_hip]"; \
       fi

RUN cp -r /sgl-workspace/sglang /sglang
RUN python -m pip cache purge

kk's avatar
kk committed
45
46
47
48
49
50
RUN pip install IPython \
    && pip install orjson \
    && pip install python-multipart \
    && pip install torchao \
    && pip install pybind11

51
52
53
54
55
56
57
RUN pip uninstall -y triton
RUN git clone ${TRITON_REPO} \
    && cd triton \
    && git checkout ${TRITON_COMMIT} \
    && cd python \
    && python3 setup.py install

58
59
60
RUN git clone ${AITER_REPO} \
    && cd aiter \
    && git checkout ${AITER_COMMIT} \
61
62
63
    && git submodule update --init --recursive \
    && PREBUILD_KERNELS=1 GPU_ARCHS=gfx942 python3 setup.py develop

64
65
66
67
68
# Copy config files to support MI300X in virtualized environments (MI300X_VF).  Symlinks will not be created in image build.
RUN find /sgl-workspace/sglang/python/sglang/srt/layers/quantization/configs/ \
         /sgl-workspace/sglang/python/sglang/srt/layers/moe/fused_moe_triton/configs/ \
         -type f -name '*MI300X*' | xargs -I {} sh -c 'vf_config=$(echo "$1" | sed "s/MI300X/MI300X_VF/"); cp "$1" "$vf_config"' -- {}

69
70
71
# Performance environment variable.

ENV HIP_FORCE_DEV_KERNARG=1
HAI's avatar
HAI committed
72
ENV HSA_NO_SCRATCH_RECLAIM=1
73
ENV SGLANG_SET_CPU_AFFINITY=1
74
75
76
ENV SGLANG_ALLOW_OVERWRITE_LONGER_CONTEXT_LEN=1
ENV NCCL_MIN_NCHANNELS=112

HAI's avatar
HAI committed
77
ENV SGLANG_MOE_PADDING=1
78
79
80
81
ENV VLLM_FP8_PADDING=1
ENV VLLM_FP8_ACT_PADDING=1
ENV VLLM_FP8_WEIGHT_PADDING=1
ENV VLLM_FP8_REDUCE_CONV=1
82
83
ENV TORCHINDUCTOR_MAX_AUTOTUNE=1
ENV TORCHINDUCTOR_MAX_AUTOTUNE_POINTWISE=1
84
85

CMD ["/bin/bash"]