Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
9d6235ca
Unverified
Commit
9d6235ca
authored
Dec 08, 2025
by
Ming Yang
Committed by
GitHub
Dec 09, 2025
Browse files
[moe] Allow disabling DP chunking (#29936)
Signed-off-by:
Ming Yang
<
minos.future@gmail.com
>
parent
f1599ca5
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
5 additions
and
1 deletion
+5
-1
vllm/envs.py
vllm/envs.py
+4
-0
vllm/model_executor/layers/fused_moe/layer.py
vllm/model_executor/layers/fused_moe/layer.py
+1
-1
No files found.
vllm/envs.py
View file @
9d6235ca
...
...
@@ -144,6 +144,7 @@ if TYPE_CHECKING:
VLLM_DP_MASTER_IP
:
str
=
""
VLLM_DP_MASTER_PORT
:
int
=
0
VLLM_MOE_DP_CHUNK_SIZE
:
int
=
256
VLLM_ENABLE_MOE_DP_CHUNK
:
bool
=
True
VLLM_RANDOMIZE_DP_DUMMY_INPUTS
:
bool
=
False
VLLM_RAY_DP_PACK_STRATEGY
:
Literal
[
"strict"
,
"fill"
,
"span"
]
=
"strict"
VLLM_MARLIN_USE_ATOMIC_ADD
:
bool
=
False
...
...
@@ -1101,6 +1102,9 @@ environment_variables: dict[str, Callable[[], Any]] = {
# rank. All DP ranks process the activations in VLLM_MOE_DP_CHUNK_SIZE
# units.
"VLLM_MOE_DP_CHUNK_SIZE"
:
lambda
:
int
(
os
.
getenv
(
"VLLM_MOE_DP_CHUNK_SIZE"
,
"256"
)),
"VLLM_ENABLE_MOE_DP_CHUNK"
:
lambda
:
bool
(
int
(
os
.
getenv
(
"VLLM_ENABLE_MOE_DP_CHUNK"
,
"1"
))
),
# Randomize inputs during dummy runs when using Data Parallel
"VLLM_RANDOMIZE_DP_DUMMY_INPUTS"
:
lambda
:
os
.
environ
.
get
(
"VLLM_RANDOMIZE_DP_DUMMY_INPUTS"
,
"0"
...
...
vllm/model_executor/layers/fused_moe/layer.py
View file @
9d6235ca
...
...
@@ -753,7 +753,7 @@ class FusedMoE(CustomOp):
self
.
moe_parallel_config
.
use_pplx_kernels
or
self
.
moe_parallel_config
.
use_deepep_ll_kernels
or
(
self
.
dp_size
>
1
and
self
.
use_flashinfer_cutlass_kernels
)
)
)
and
envs
.
VLLM_ENABLE_MOE_DP_CHUNK
@
property
def
is_internal_router
(
self
)
->
bool
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment