Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
55310f4f
"vscode:/vscode.git/clone" did not exist on "2991dd3d2241cb3b188a047282e58111684e0201"
Commit
55310f4f
authored
Dec 02, 2025
by
王敏
Browse files
[fix]回退错误修改,避免dp模式漏掉的dispatch和combine通信
parent
2ae2d013
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
2 additions
and
5 deletions
+2
-5
vllm/forward_context.py
vllm/forward_context.py
+1
-2
vllm/model_executor/layers/fused_moe/layer.py
vllm/model_executor/layers/fused_moe/layer.py
+1
-3
No files found.
vllm/forward_context.py
View file @
55310f4f
...
@@ -136,8 +136,7 @@ def set_forward_context(
...
@@ -136,8 +136,7 @@ def set_forward_context(
forward_start_time
=
time
.
perf_counter
()
forward_start_time
=
time
.
perf_counter
()
dp_metadata
:
Optional
[
DPMetadata
]
=
None
dp_metadata
:
Optional
[
DPMetadata
]
=
None
dp_size
=
vllm_config
.
parallel_config
.
data_parallel_size
dp_size
=
vllm_config
.
parallel_config
.
data_parallel_size
use_navie_ep
=
envs
.
VLLM_ALL2ALL_BACKEND
==
'naive'
and
dp_size
>
1
and
vllm_config
.
parallel_config
.
enable_expert_parallel
if
dp_size
>
1
and
(
if
use_navie_ep
and
dp_size
>
1
and
(
attn_metadata
is
not
None
or
num_tokens
is
not
None
):
attn_metadata
is
not
None
or
num_tokens
is
not
None
):
dp_metadata
=
DPMetadata
.
make
(
vllm_config
.
parallel_config
,
dp_metadata
=
DPMetadata
.
make
(
vllm_config
.
parallel_config
,
attn_metadata
,
num_tokens
or
0
,
attn_metadata
,
num_tokens
or
0
,
...
...
vllm/model_executor/layers/fused_moe/layer.py
View file @
55310f4f
...
@@ -1537,9 +1537,7 @@ class FusedMoE(torch.nn.Module):
...
@@ -1537,9 +1537,7 @@ class FusedMoE(torch.nn.Module):
do_naive_dispatch_combine
:
bool
=
(
do_naive_dispatch_combine
:
bool
=
(
self
.
dp_size
>
1
self
.
dp_size
>
1
and
self
.
ep_size
>
1
and
not
self
.
moe_parallel_config
.
use_deepep_ht_kernels
)
and
envs
.
VLLM_ALL2ALL_BACKEND
==
'naive'
)
#and not self.moe_parallel_config.use_deepep_ht_kernels)
if
do_naive_dispatch_combine
:
if
do_naive_dispatch_combine
:
hidden_states
,
router_logits
=
get_ep_group
().
dispatch
(
hidden_states
,
router_logits
=
get_ep_group
().
dispatch
(
hidden_states
,
router_logits
)
hidden_states
,
router_logits
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment