"lib/bindings/vscode:/vscode.git/clone" did not exist on "a79122c6e06e03db993951f2c1e74ac65dd62d48"
Unverified Commit 47c3dad7 authored by ishandhanani's avatar ishandhanani Committed by GitHub
Browse files

chore(sglang): support dp attention routing (#1415)

parent d83633b5
......@@ -135,9 +135,8 @@ RUN if [ "$ARCH" = "arm64" ]; then \
# Install sglang
# Once either 0.4.6.post6 or 0.4.7 is released, we can switch back to the published version
# This commit references multiple perf fixes for DP attention and NIXL https://github.com/sgl-project/sglang/pull/6780
# 6/2(ishan) - moving to ToT for performance purposes
ARG SGLANG_COMMIT="6376b632eb4daef306b89ede0eabdcb89ddff728"
# This commit includes a fix that adds DP-attention-based routing, along with other perf fixes: https://github.com/sgl-project/sglang/pull/6884
ARG SGLANG_COMMIT="f1569876d54dd3b6601f5280f12652e9fbb1375c"
RUN --mount=type=cache,target=/root/.cache/uv \
git clone https://github.com/sgl-project/sglang.git && \
cd sglang && \
......
......@@ -60,3 +60,4 @@ class DisaggPreprocessedRequest(BaseModel):
bootstrap_host: str
bootstrap_port: int
bootstrap_room: int
data_parallel_rank: Optional[int] = None
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment