Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
1072b724
Commit
1072b724
authored
Dec 23, 2025
by
zhuwenwen
Browse files
fix moe params and run error
parent
2461ea9d
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
3 additions
and
0 deletions
+3
-0
vllm/model_executor/layers/fused_moe/fused_moe.py
vllm/model_executor/layers/fused_moe/fused_moe.py
+2
-0
vllm/model_executor/layers/fused_moe/layer.py
vllm/model_executor/layers/fused_moe/layer.py
+1
-0
No files found.
vllm/model_executor/layers/fused_moe/fused_moe.py
View file @
1072b724
...
@@ -1655,6 +1655,7 @@ def fused_experts(
...
@@ -1655,6 +1655,7 @@ def fused_experts(
quant_config
:
FusedMoEQuantConfig
|
None
=
None
,
quant_config
:
FusedMoEQuantConfig
|
None
=
None
,
allow_deep_gemm
:
bool
=
False
,
allow_deep_gemm
:
bool
=
False
,
allow_cutlass_block_scaled_grouped_gemm
:
bool
=
False
,
allow_cutlass_block_scaled_grouped_gemm
:
bool
=
False
,
use_nn_moe
:
bool
|
None
=
False
,
)
->
torch
.
Tensor
:
)
->
torch
.
Tensor
:
if
quant_config
is
None
:
if
quant_config
is
None
:
quant_config
=
FUSED_MOE_UNQUANTIZED_CONFIG
quant_config
=
FUSED_MOE_UNQUANTIZED_CONFIG
...
@@ -1732,6 +1733,7 @@ def fused_experts(
...
@@ -1732,6 +1733,7 @@ def fused_experts(
block_shape
=
quant_config
.
block_shape
,
block_shape
=
quant_config
.
block_shape
,
w1_bias
=
quant_config
.
w1_bias
,
w1_bias
=
quant_config
.
w1_bias
,
w2_bias
=
quant_config
.
w2_bias
,
w2_bias
=
quant_config
.
w2_bias
,
use_nn_moe
=
use_nn_moe
,
)
)
...
...
vllm/model_executor/layers/fused_moe/layer.py
View file @
1072b724
...
@@ -1985,6 +1985,7 @@ class FusedMoE(CustomOp):
...
@@ -1985,6 +1985,7 @@ class FusedMoE(CustomOp):
if
do_naive_dispatch_combine
if
do_naive_dispatch_combine
else
hidden_states
,
else
hidden_states
,
router_logits
=
router_logits
,
router_logits
=
router_logits
,
use_nn_moe
=
self
.
use_nn_moe
,
)
)
if
has_separate_shared_experts
:
if
has_separate_shared_experts
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment