Unverified commit 7b979c00, authored by Krishnan Prashanth, committed by GitHub
Browse files

fix: Add accelerate to sglang runtime image for diffusion workers (#8357)


Signed-off-by: Krishnan Prashanth <kprashanth@nvidia.com>
parent 2e3d4a92
...@@ -50,6 +50,12 @@ RUN --mount=type=cache,target=/root/.cache/pip,sharing=locked \ ...@@ -50,6 +50,12 @@ RUN --mount=type=cache,target=/root/.cache/pip,sharing=locked \
/opt/dynamo/wheelhouse/ai_dynamo_runtime*.whl \ /opt/dynamo/wheelhouse/ai_dynamo_runtime*.whl \
/opt/dynamo/wheelhouse/ai_dynamo*any.whl /opt/dynamo/wheelhouse/ai_dynamo*any.whl
# diffusers needs accelerate for enable_model_cpu_offload, and the upstream
# SGLang runtime image does not ship it, so add it here for the diffusion/video
# worker pipelines. --no-deps installs only accelerate itself, without pulling
# in its dependencies.
RUN --mount=type=cache,target=/root/.cache/pip,sharing=locked \
    PIP_CACHE_DIR=/root/.cache/pip \
    pip install --break-system-packages --no-deps "accelerate==1.13.0"
# Install gpu_memory_service wheel if enabled (all targets) # Install gpu_memory_service wheel if enabled (all targets)
ARG ENABLE_GPU_MEMORY_SERVICE ARG ENABLE_GPU_MEMORY_SERVICE
RUN --mount=type=cache,target=/root/.cache/pip,sharing=locked \ RUN --mount=type=cache,target=/root/.cache/pip,sharing=locked \
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment