Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
c0c6f543
Unverified
Commit c0c6f543 authored Sep 16, 2025 by Yineng Zhang
Committed by GitHub Sep 16, 2025
Browse files
chore: upgrade sgl-kernel 0.3.10 (#10500)
parent
edd6a07b
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing 5 changed files with 10 additions and 10 deletions
+10
-10
docker/Dockerfile
docker/Dockerfile
+1
-1
docker/Dockerfile.gb200
docker/Dockerfile.gb200
+1
-1
python/pyproject.toml
python/pyproject.toml
+4
-4
python/pyproject_other.toml
python/pyproject_other.toml
+3
-3
python/sglang/srt/entrypoints/engine.py
python/sglang/srt/entrypoints/engine.py
+1
-1
No files found.
docker/Dockerfile
View file @
c0c6f543
...
@@ -85,7 +85,7 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li
...
@@ -85,7 +85,7 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li
&& python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \
&& python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \
&& python3 -m flashinfer --download-cubin \
&& python3 -m flashinfer --download-cubin \
&& if [ "$CUDA_VERSION" = "12.6.1" ]; then \
&& if [ "$CUDA_VERSION" = "12.6.1" ]; then \
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.9.post2/sgl_kernel-0.3.9.post2+cu124-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.10/sgl_kernel-0.3.10+cu124-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
fi
fi
# Download source files
# Download source files
...
...
docker/Dockerfile.gb200
View file @
c0c6f543
...
@@ -4,7 +4,7 @@ FROM nvidia/cuda:${CUDA_VERSION}-cudnn-devel-ubuntu22.04
...
@@ -4,7 +4,7 @@ FROM nvidia/cuda:${CUDA_VERSION}-cudnn-devel-ubuntu22.04
ARG BUILD_TYPE=blackwell
ARG BUILD_TYPE=blackwell
ARG DEEPEP_COMMIT=1b14ad661c7640137fcfe93cccb2694ede1220b0
ARG DEEPEP_COMMIT=1b14ad661c7640137fcfe93cccb2694ede1220b0
ARG CMAKE_BUILD_PARALLEL_LEVEL=2
ARG CMAKE_BUILD_PARALLEL_LEVEL=2
ARG SGL_KERNEL_VERSION=0.3.9.post2
ARG SGL_KERNEL_VERSION=0.3.10
ENV DEBIAN_FRONTEND=noninteractive \
ENV DEBIAN_FRONTEND=noninteractive \
CUDA_HOME=/usr/local/cuda \
CUDA_HOME=/usr/local/cuda \
GDRCOPY_HOME=/usr/src/gdrdrv-2.4.4/ \
GDRCOPY_HOME=/usr/src/gdrdrv-2.4.4/ \
...
...
python/pyproject.toml
View file @
c0c6f543
...
@@ -57,7 +57,7 @@ dependencies = [
...
@@ -57,7 +57,7 @@ dependencies = [
"uvicorn",
"uvicorn",
"uvloop",
"uvloop",
"xgrammar==0.1.24",
"xgrammar==0.1.24",
"sgl-kernel==0.3.9.post2",
"sgl-kernel==0.3.10",
"torch==2.8.0",
"torch==2.8.0",
"torchaudio==2.8.0",
"torchaudio==2.8.0",
"torchvision",
"torchvision",
...
@@ -67,10 +67,10 @@ dependencies = [
...
@@ -67,10 +67,10 @@ dependencies = [
"tiktoken",
"tiktoken",
"anthropic>=0.20.0",
"anthropic>=0.20.0",
"torch_memory_saver==0.0.8",
"torch_memory_saver==0.0.8",
"decord",
]
]
[project.optional-dependencies]
[project.optional-dependencies]
decord = ["decord"]
test = [
test = [
"accelerate",
"accelerate",
"expecttest",
"expecttest",
...
@@ -88,8 +88,8 @@ tracing = [
...
@@ -88,8 +88,8 @@ tracing = [
"opentelemetry-exporter-otlp",
"opentelemetry-exporter-otlp",
"opentelemetry-exporter-otlp-proto-grpc",
"opentelemetry-exporter-otlp-proto-grpc",
]
]
all = ["sglang[test]"]
all = ["sglang[test]", "sglang[decord]"]
blackwell = ["nvidia-cutlass-dsl==4.1.0", "sglang[test]"]
blackwell = ["nvidia-cutlass-dsl==4.2.0", "sglang[test]"]
dev = ["sglang[test]"]
dev = ["sglang[test]"]
[project.urls]
[project.urls]
...
...
python/pyproject_other.toml
View file @
c0c6f543
...
@@ -65,7 +65,7 @@ tracing = [
...
@@ -65,7 +65,7 @@ tracing = [
srt = [
srt = [
"sglang[runtime_common]",
"sglang[runtime_common]",
"sgl-kernel==0.3.9.post2",
"sgl-kernel==0.3.10",
"torch==2.8.0",
"torch==2.8.0",
"torchaudio==2.8.0",
"torchaudio==2.8.0",
"torchvision",
"torchvision",
...
@@ -75,13 +75,13 @@ srt = [
...
@@ -75,13 +75,13 @@ srt = [
blackwell = [
blackwell = [
"sglang[runtime_common]",
"sglang[runtime_common]",
"sgl-kernel==0.3.9.post2",
"sgl-kernel==0.3.10",
"torch==2.8.0",
"torch==2.8.0",
"torchaudio==2.8.0",
"torchaudio==2.8.0",
"torchvision",
"torchvision",
"cuda-python",
"cuda-python",
"flashinfer_python==0.3.1",
"flashinfer_python==0.3.1",
"nvidia-cutlass-dsl==4.1.0",
"nvidia-cutlass-dsl==4.2.0",
]
]
# HIP (Heterogeneous-computing Interface for Portability) for AMD
# HIP (Heterogeneous-computing Interface for Portability) for AMD
...
...
python/sglang/srt/entrypoints/engine.py
View file @
c0c6f543
...
@@ -690,7 +690,7 @@ def _set_envs_and_config(server_args: ServerArgs):
...
@@ -690,7 +690,7 @@ def _set_envs_and_config(server_args: ServerArgs):
if _is_cuda and not get_bool_env_var("SGLANG_SKIP_SGL_KERNEL_VERSION_CHECK"):
if _is_cuda and not get_bool_env_var("SGLANG_SKIP_SGL_KERNEL_VERSION_CHECK"):
assert_pkg_version(
assert_pkg_version(
"sgl-kernel",
"sgl-kernel",
"0.3.9.post2",
"0.3.10",
"Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`",
"Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`",
)
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment