Unverified Commit da0c5726 authored by ishandhanani's avatar ishandhanani Committed by GitHub
Browse files

chore: update sgl version and fix h100 wideep example (#2169)

parent 30d4612e
...@@ -176,7 +176,6 @@ uv pip install ai-dynamo[sglang] ...@@ -176,7 +176,6 @@ uv pip install ai-dynamo[sglang]
Run the backend/worker like this: Run the backend/worker like this:
``` ```
# Note the '.worker' in the module path for SGLang
python -m dynamo.sglang.worker --help python -m dynamo.sglang.worker --help
``` ```
......
...@@ -9,15 +9,13 @@ Dynamo supports SGLang's implementation of wide expert parallelism and large sca ...@@ -9,15 +9,13 @@ Dynamo supports SGLang's implementation of wide expert parallelism and large sca
## Instructions ## Instructions
1. Build the SGLang DeepEP container. 1. Pull the SGLang container.
```bash ```bash
git clone -b v0.4.9.post2 https://github.com/sgl-project/sglang.git docker pull lmsysorg/sglang:latest
cd sglang/docker
docker build -f Dockerfile -t sgl-widepep .
``` ```
You will now have a `sgl-widepep:latest` image You can also pull a specific tag from the [lmsys dockerhub](https://hub.docker.com/r/lmsysorg/sglang/tags)
2. Build the Dynamo container 2. Build the Dynamo container
......
...@@ -27,7 +27,7 @@ ARG ARCH=amd64 ...@@ -27,7 +27,7 @@ ARG ARCH=amd64
ARG ARCH_ALT=x86_64 ARG ARCH_ALT=x86_64
# Make sure to update the dependency version in pyproject.toml when updating this # Make sure to update the dependency version in pyproject.toml when updating this
ARG SGLANG_VERSION="0.4.9.post1" ARG SGLANG_VERSION="0.4.9.post6"
################################## ##################################
########## Base Image ############ ########## Base Image ############
......
...@@ -13,9 +13,9 @@ ...@@ -13,9 +13,9 @@
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# Note this container is built from a local dockerfile # This should be pinned to the sglang version that is installed with Dynamo
# Please see instructions in examples/sglang/README.md # in the pyproject.toml
FROM sgl-wideep:latest FROM lmsysorg/sglang:v0.4.9.post6-cu126
# Add NIXL build dependencies # Add NIXL build dependencies
RUN apt-get update -y && \ RUN apt-get update -y && \
...@@ -80,10 +80,7 @@ WORKDIR /sgl-workspace ...@@ -80,10 +80,7 @@ WORKDIR /sgl-workspace
ENV SGL_FORCE_SHUTDOWN=1 ENV SGL_FORCE_SHUTDOWN=1
WORKDIR /sgl-workspace WORKDIR /sgl-workspace
# include flush cache endpoint and server support RUN git clone https://github.com/ai-dynamo/dynamo.git
# https://github.com/ai-dynamo/dynamo/pull/1769
ARG DYNAMO_COMMIT="bd91dca6141e05bcfbe9bd4dea54cc58b9e37d75"
RUN git clone https://github.com/ai-dynamo/dynamo.git && cd dynamo && git checkout ${DYNAMO_COMMIT}
# install dynamo in editable mode # install dynamo in editable mode
WORKDIR /sgl-workspace/dynamo WORKDIR /sgl-workspace/dynamo
...@@ -126,8 +123,6 @@ RUN cargo build --release ...@@ -126,8 +123,6 @@ RUN cargo build --release
RUN cd lib/bindings/python && pip install --break-system-packages -e . && cd ../../.. RUN cd lib/bindings/python && pip install --break-system-packages -e . && cd ../../..
RUN pip install --break-system-packages -e . RUN pip install --break-system-packages -e .
ENV PYTHONPATH=/sgl-workspace/dynamo/components/planner/src:/sgl-workspace/dynamo/examples/sglang:$PYTHONPATH
RUN wget --tries=3 --waitretry=5 https://github.com/nats-io/nats-server/releases/download/v2.10.28/nats-server-v2.10.28-${ARCH}.deb && \ RUN wget --tries=3 --waitretry=5 https://github.com/nats-io/nats-server/releases/download/v2.10.28/nats-server-v2.10.28-${ARCH}.deb && \
dpkg -i nats-server-v2.10.28-${ARCH}.deb && rm nats-server-v2.10.28-${ARCH}.deb dpkg -i nats-server-v2.10.28-${ARCH}.deb && rm nats-server-v2.10.28-${ARCH}.deb
...@@ -168,7 +163,7 @@ ENV PATH=/sgl-workspace/perf_analyzer/build/perf_analyzer/src/perf-analyzer-buil ...@@ -168,7 +163,7 @@ ENV PATH=/sgl-workspace/perf_analyzer/build/perf_analyzer/src/perf-analyzer-buil
RUN pip install --break-system-packages genai-perf RUN pip install --break-system-packages genai-perf
COPY examples/sglang/configs/deepseek_r1/wideep/* /sgl-workspace/dynamo/examples/sglang/configs/ # https://pypi.org/project/sglang-router/0.1.5 is latest
COPY examples/sglang/utils/benchmarking/* /sgl-workspace/dynamo/examples/sglang/utils/ RUN pip install sglang-router==0.1.5
WORKDIR /sgl-workspace/dynamo/examples/sglang WORKDIR /sgl-workspace/dynamo/components/backends/sglang
...@@ -73,10 +73,7 @@ vllm = [ ...@@ -73,10 +73,7 @@ vllm = [
sglang = [ sglang = [
"uvloop", "uvloop",
"nixl", "nixl",
"sglang[runtime_common]==0.4.9.post1", "sglang[all]==0.4.9.post6",
"einops",
"sgl-kernel==0.2.4",
"sentencepiece",
] ]
llama_cpp = [ llama_cpp = [
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment