Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
zhaoyu6
sglang
Commits
349bb2c9
"vscode:/vscode.git/clone" did not exist on "4cb2cc62d245617fa178702df99852deccb3e15a"
Unverified
Commit
349bb2c9
authored
Jun 15, 2025
by
fzyzcjy
Committed by
GitHub
Jun 14, 2025
Browse files
Fix error when disabling new DeepGEMM (#7198)
parent
0b8939bc
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
3 deletions
+8
-3
python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py
python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py
+4
-2
python/sglang/srt/models/deepseek_v2.py
python/sglang/srt/models/deepseek_v2.py
+4
-1
No files found.
python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py
View file @
349bb2c9
...
@@ -584,8 +584,10 @@ class _DeepEPDispatcherImplLowLatency(_DeepEPDispatcherImplBase):
...
@@ -584,8 +584,10 @@ class _DeepEPDispatcherImplLowLatency(_DeepEPDispatcherImplBase):
use_fp8
=
use_fp8
,
use_fp8
=
use_fp8
,
async_finish
=
not
self
.
return_recv_hook
,
async_finish
=
not
self
.
return_recv_hook
,
return_recv_hook
=
self
.
return_recv_hook
,
return_recv_hook
=
self
.
return_recv_hook
,
round_scale
=
deep_gemm_wrapper
.
DEEPGEMM_V202506
,
round_scale
=
deep_gemm_wrapper
.
ENABLE_JIT_DEEPGEMM
use_ue8m0
=
deep_gemm_wrapper
.
DEEPGEMM_V202506
,
and
deep_gemm_wrapper
.
DEEPGEMM_V202506
,
use_ue8m0
=
deep_gemm_wrapper
.
ENABLE_JIT_DEEPGEMM
and
deep_gemm_wrapper
.
DEEPGEMM_V202506
,
)
)
)
)
return
packed_recv_hidden
,
packed_recv_count
,
event
,
hook
return
packed_recv_hidden
,
packed_recv_count
,
event
,
hook
...
...
python/sglang/srt/models/deepseek_v2.py
View file @
349bb2c9
...
@@ -1914,7 +1914,10 @@ class DeepseekV2ForCausalLM(nn.Module):
...
@@ -1914,7 +1914,10 @@ class DeepseekV2ForCausalLM(nn.Module):
self_attn
.
w_vc
=
bind_or_assign
(
self_attn
.
w_vc
,
w_vc
.
contiguous
())
self_attn
.
w_vc
=
bind_or_assign
(
self_attn
.
w_vc
,
w_vc
.
contiguous
())
self_attn
.
use_deep_gemm_bmm
=
True
self_attn
.
use_deep_gemm_bmm
=
True
if
deep_gemm_wrapper
.
DEEPGEMM_SCALE_UE8M0
:
if
(
deep_gemm_wrapper
.
ENABLE_JIT_DEEPGEMM
and
deep_gemm_wrapper
.
DEEPGEMM_SCALE_UE8M0
):
self
.
_weight_requant_ue8m0
()
self
.
_weight_requant_ue8m0
()
def
_weight_requant_ue8m0
(
self
):
def
_weight_requant_ue8m0
(
self
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment