Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
b18416fb
"git@developer.sourcefind.cn:ox696c/ktransformers.git" did not exist on "107e4be41791c3f888051bb64e9ff91f0dab77f0"
Unverified
Commit
b18416fb
authored
May 27, 2025
by
Yi Zhang
Committed by
GitHub
May 27, 2025
Browse files
Fix qwen3 tbo/dp-lm-head (#6652)
parent
ce9d690e
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
3 additions
and
1 deletion
+3
-1
python/sglang/srt/models/qwen2_moe.py
python/sglang/srt/models/qwen2_moe.py
+1
-0
python/sglang/srt/models/qwen3_moe.py
python/sglang/srt/models/qwen3_moe.py
+1
-0
python/sglang/srt/two_batch_overlap.py
python/sglang/srt/two_batch_overlap.py
+1
-1
No files found.
python/sglang/srt/models/qwen2_moe.py
View file @
b18416fb
...
@@ -501,6 +501,7 @@ class Qwen2MoeForCausalLM(nn.Module):
...
@@ -501,6 +501,7 @@ class Qwen2MoeForCausalLM(nn.Module):
config
.
hidden_size
,
config
.
hidden_size
,
quant_config
=
quant_config
,
quant_config
=
quant_config
,
prefix
=
add_prefix
(
"lm_head"
,
prefix
),
prefix
=
add_prefix
(
"lm_head"
,
prefix
),
use_attn_tp_group
=
global_server_args_dict
[
"enable_dp_lm_head"
],
)
)
self
.
logits_processor
=
LogitsProcessor
(
config
)
self
.
logits_processor
=
LogitsProcessor
(
config
)
...
...
python/sglang/srt/models/qwen3_moe.py
View file @
b18416fb
...
@@ -688,6 +688,7 @@ class Qwen3MoeForCausalLM(nn.Module):
...
@@ -688,6 +688,7 @@ class Qwen3MoeForCausalLM(nn.Module):
config
.
hidden_size
,
config
.
hidden_size
,
quant_config
=
quant_config
,
quant_config
=
quant_config
,
prefix
=
add_prefix
(
"lm_head"
,
prefix
),
prefix
=
add_prefix
(
"lm_head"
,
prefix
),
use_attn_tp_group
=
global_server_args_dict
[
"enable_dp_lm_head"
],
)
)
self
.
logits_processor
=
LogitsProcessor
(
config
)
self
.
logits_processor
=
LogitsProcessor
(
config
)
...
...
python/sglang/srt/two_batch_overlap.py
View file @
b18416fb
...
@@ -370,7 +370,7 @@ def model_forward_maybe_tbo(
...
@@ -370,7 +370,7 @@ def model_forward_maybe_tbo(
hidden_states
=
hidden_states
,
hidden_states
=
hidden_states
,
forward_batch
=
forward_batch
,
forward_batch
=
forward_batch
,
residual
=
residual
,
residual
=
residual
,
**
(
dict
(
zero_allocator
=
zero_allocator
)
if
zero_allocator
is
not
None
else
{})
,
zero_allocator
=
zero_allocator
,
)
)
layer_input_scatter_mode
=
layers
[
0
].
layer_scatter_modes
.
layer_input_mode
layer_input_scatter_mode
=
layers
[
0
].
layer_scatter_modes
.
layer_input_mode
operations_strategy
=
OperationsStrategy
.
init_new_tbo
(
operations_strategy
=
OperationsStrategy
.
init_new_tbo
(
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment