Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
ed89837c
Unverified
Commit
ed89837c
authored
Jun 15, 2025
by
JieXin Liang
Committed by
GitHub
Jun 14, 2025
Browse files
chore: upgrade sgl-kernel v0.1.8.post2 (#7186)
Co-authored-by:
zhyncs
<
me@zhyncs.com
>
parent
55561e25
Changes
4
Show whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
8 additions
and
3 deletions
+8
-3
python/pyproject.toml
python/pyproject.toml
+1
-1
python/sglang/srt/entrypoints/engine.py
python/sglang/srt/entrypoints/engine.py
+1
-1
python/sglang/srt/layers/attention/cutlass_mla_backend.py
python/sglang/srt/layers/attention/cutlass_mla_backend.py
+1
-0
python/sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py
...g/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py
+5
-1
No files found.
python/pyproject.toml
View file @
ed89837c
...
@@ -49,7 +49,7 @@ runtime_common = [
...
@@ -49,7 +49,7 @@ runtime_common = [
srt
=
[
srt
=
[
"sglang[runtime_common]"
,
"sglang[runtime_common]"
,
"sgl-kernel==0.1.8.post
1
"
,
"sgl-kernel==0.1.8.post
2
"
,
"flashinfer_python==0.2.6.post1"
,
"flashinfer_python==0.2.6.post1"
,
"torch==2.7.1"
,
"torch==2.7.1"
,
"torchaudio==2.7.1"
,
"torchaudio==2.7.1"
,
...
...
python/sglang/srt/entrypoints/engine.py
View file @
ed89837c
...
@@ -605,7 +605,7 @@ def _set_envs_and_config(server_args: ServerArgs):
...
@@ -605,7 +605,7 @@ def _set_envs_and_config(server_args: ServerArgs):
if
_is_cuda
:
if
_is_cuda
:
assert_pkg_version
(
assert_pkg_version
(
"sgl-kernel"
,
"sgl-kernel"
,
"0.1.8.post
1
"
,
"0.1.8.post
2
"
,
"Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`"
,
"Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`"
,
)
)
...
...
python/sglang/srt/layers/attention/cutlass_mla_backend.py
View file @
ed89837c
...
@@ -280,6 +280,7 @@ class CutlassMLABackend(FlashInferMLAAttnBackend):
...
@@ -280,6 +280,7 @@ class CutlassMLABackend(FlashInferMLAAttnBackend):
seq_lens
=
forward_batch
.
seq_lens
.
to
(
torch
.
int32
),
seq_lens
=
forward_batch
.
seq_lens
.
to
(
torch
.
int32
),
page_table
=
self
.
forward_metadata
.
block_kv_indices
,
page_table
=
self
.
forward_metadata
.
block_kv_indices
,
workspace
=
self
.
forward_metadata
.
workspace
,
workspace
=
self
.
forward_metadata
.
workspace
,
sm_scale
=
layer
.
scaling
,
num_kv_splits
=
1
,
num_kv_splits
=
1
,
)
)
...
...
python/sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py
View file @
ed89837c
...
@@ -52,7 +52,11 @@ def grouped_gemm_nt_f8f8bf16_masked(
...
@@ -52,7 +52,11 @@ def grouped_gemm_nt_f8f8bf16_masked(
expected_m
,
n
,
k
,
num_groups
,
kernel_type
expected_m
,
n
,
k
,
num_groups
,
kernel_type
):
):
_grouped_gemm_nt_f8f8bf16_masked_raw
(
_grouped_gemm_nt_f8f8bf16_masked_raw
(
lhs
,
rhs
,
out
,
masked_m
,
expected_m
,
lhs
,
rhs
,
out
,
masked_m
,
expected_m
,
**
({
"recipe"
:
recipe
}
if
DEEPGEMM_V202506
else
{})
**
({
"recipe"
:
recipe
}
if
DEEPGEMM_V202506
else
{})
)
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment