"server/text_generation_server/models/t5.py" did not exist on "fa43fb71be75064de58784e96b16b14f7b3b4912"
Unverified commit b6e0cfb5, authored by kk and committed by GitHub
Browse files

ROCm base image update (#2692)


Co-authored-by: wunhuang <wunhuang@amd.com>
parent 0d8d97b8
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
# docker build --build-arg SGL_BRANCH=v0.4.1.post3 -t v0.4.1.post3-rocm620 -f Dockerfile.rocm . # docker build --build-arg SGL_BRANCH=v0.4.1.post3 -t v0.4.1.post3-rocm620 -f Dockerfile.rocm .
# default base image # default base image
ARG BASE_IMAGE="rocm/vllm-dev:20241022" ARG BASE_IMAGE="rocm/vllm-dev:20241031-tuned"
FROM $BASE_IMAGE AS base FROM $BASE_IMAGE AS base
USER root USER root
...@@ -33,6 +33,12 @@ RUN git clone ${SGL_REPO} \ ...@@ -33,6 +33,12 @@ RUN git clone ${SGL_REPO} \
RUN cp -r /sgl-workspace/sglang /sglang RUN cp -r /sgl-workspace/sglang /sglang
RUN python -m pip cache purge RUN python -m pip cache purge
RUN pip install IPython \
&& pip install orjson \
&& pip install python-multipart \
&& pip install torchao \
&& pip install pybind11
RUN pip uninstall -y triton RUN pip uninstall -y triton
RUN git clone ${TRITON_REPO} \ RUN git clone ${TRITON_REPO} \
&& cd triton \ && cd triton \
......
...@@ -27,7 +27,7 @@ srt = ["sglang[runtime_common]", "torch", "vllm>=0.6.3.post1,<=0.6.4.post1", "cu ...@@ -27,7 +27,7 @@ srt = ["sglang[runtime_common]", "torch", "vllm>=0.6.3.post1,<=0.6.4.post1", "cu
# HIP (Heterogeneous-computing Interface for Portability) for AMD # HIP (Heterogeneous-computing Interface for Portability) for AMD
# => base docker rocm/vllm-dev:20241022, not from public vllm whl # => base docker rocm/vllm-dev:20241022, not from public vllm whl
srt_hip = ["sglang[runtime_common]", "torch", "vllm==0.6.3.dev13"] srt_hip = ["sglang[runtime_common]", "torch", "vllm==0.6.3.post2.dev1"]
# xpu is not enabled in public vllm and torch whl, # xpu is not enabled in public vllm and torch whl,
# need to follow https://docs.vllm.ai/en/latest/getting_started/xpu-installation.html to install vllm # need to follow https://docs.vllm.ai/en/latest/getting_started/xpu-installation.html to install vllm
srt_xpu = ["sglang[runtime_common]"] srt_xpu = ["sglang[runtime_common]"]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment