Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
31d992d2
Unverified
Commit
31d992d2
authored
Feb 11, 2026
by
bnellnm
Committed by
GitHub
Feb 11, 2026
Browse files
[Bugfix] Fix some issues with MoERunner PR #32344 (#34371)
Signed-off-by:
Bill Nell
<
bnell@redhat.com
>
parent
5aff2699
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
6 additions
and
3 deletions
+6
-3
vllm/model_executor/layers/fused_moe/layer.py
vllm/model_executor/layers/fused_moe/layer.py
+2
-3
vllm/model_executor/layers/fused_moe/runner/default_moe_runner.py
...el_executor/layers/fused_moe/runner/default_moe_runner.py
+4
-0
No files found.
vllm/model_executor/layers/fused_moe/layer.py
View file @
31d992d2
...
@@ -700,7 +700,7 @@ class FusedMoE(CustomOp):
...
@@ -700,7 +700,7 @@ class FusedMoE(CustomOp):
@
property
@
property
def
gate
(
self
)
->
torch
.
nn
.
Module
|
None
:
def
gate
(
self
)
->
torch
.
nn
.
Module
|
None
:
return
self
.
_gate
return
self
.
_gate
if
self
.
use_overlapped
else
None
@
property
@
property
def
tp_size
(
self
):
def
tp_size
(
self
):
...
@@ -725,7 +725,7 @@ class FusedMoE(CustomOp):
...
@@ -725,7 +725,7 @@ class FusedMoE(CustomOp):
@
property
@
property
def
is_internal_router
(
self
)
->
bool
:
def
is_internal_router
(
self
)
->
bool
:
# By default, router/gate is called before FusedMoE forward pass
# By default, router/gate is called before FusedMoE forward pass
return
self
.
_
gate
is
not
None
return
self
.
gate
is
not
None
def
_maybe_init_expert_routing_tables
(
def
_maybe_init_expert_routing_tables
(
self
,
self
,
...
@@ -1457,7 +1457,6 @@ class FusedMoE(CustomOp):
...
@@ -1457,7 +1457,6 @@ class FusedMoE(CustomOp):
hidden_states
:
torch
.
Tensor
,
hidden_states
:
torch
.
Tensor
,
router_logits
:
torch
.
Tensor
,
router_logits
:
torch
.
Tensor
,
)
->
torch
.
Tensor
|
tuple
[
torch
.
Tensor
,
torch
.
Tensor
]:
)
->
torch
.
Tensor
|
tuple
[
torch
.
Tensor
,
torch
.
Tensor
]:
self
.
ensure_moe_quant_config_init
()
return
self
.
runner
.
forward
(
return
self
.
runner
.
forward
(
hidden_states
,
hidden_states
,
router_logits
,
router_logits
,
...
...
vllm/model_executor/layers/fused_moe/runner/default_moe_runner.py
View file @
31d992d2
...
@@ -63,6 +63,8 @@ def _moe_forward(
...
@@ -63,6 +63,8 @@ def _moe_forward(
layer_name
:
str
,
layer_name
:
str
,
)
->
torch
.
Tensor
:
)
->
torch
.
Tensor
:
layer
=
get_layer_from_name
(
layer_name
)
layer
=
get_layer_from_name
(
layer_name
)
# TODO(bnell): this can be removed after MK migration is complete.
layer
.
ensure_moe_quant_config_init
()
return
layer
.
runner
.
forward_impl
(
return
layer
.
runner
.
forward_impl
(
layer
,
hidden_states
,
router_logits
,
shared_experts_input
layer
,
hidden_states
,
router_logits
,
shared_experts_input
)
)
...
@@ -84,6 +86,8 @@ def _moe_forward_shared(
...
@@ -84,6 +86,8 @@ def _moe_forward_shared(
layer_name
:
str
,
layer_name
:
str
,
)
->
tuple
[
torch
.
Tensor
,
torch
.
Tensor
]:
)
->
tuple
[
torch
.
Tensor
,
torch
.
Tensor
]:
layer
=
get_layer_from_name
(
layer_name
)
layer
=
get_layer_from_name
(
layer_name
)
# TODO(bnell): this can be removed after MK migration is complete.
layer
.
ensure_moe_quant_config_init
()
return
layer
.
runner
.
forward_impl
(
return
layer
.
runner
.
forward_impl
(
layer
,
hidden_states
,
router_logits
,
shared_experts_input
layer
,
hidden_states
,
router_logits
,
shared_experts_input
)
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment