Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
eb5ed207
Unverified
Commit
eb5ed207
authored
Feb 04, 2026
by
Michael Goin
Committed by
GitHub
Feb 04, 2026
Browse files
[Bugfix] Define router_logits_dtype for remaining MoE models (#33737)
Signed-off-by:
mgoin
<
mgoin64@gmail.com
>
parent
26471636
Changes
6
Hide whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
9 additions
and
4 deletions
+9
-4
vllm/model_executor/models/afmoe.py
vllm/model_executor/models/afmoe.py
+1
-0
vllm/model_executor/models/bailing_moe.py
vllm/model_executor/models/bailing_moe.py
+1
-0
vllm/model_executor/models/flex_olmo.py
vllm/model_executor/models/flex_olmo.py
+1
-1
vllm/model_executor/models/longcat_flash.py
vllm/model_executor/models/longcat_flash.py
+4
-3
vllm/model_executor/models/mimo_v2_flash.py
vllm/model_executor/models/mimo_v2_flash.py
+1
-0
vllm/model_executor/models/step3p5.py
vllm/model_executor/models/step3p5.py
+1
-0
No files found.
vllm/model_executor/models/afmoe.py
View file @
eb5ed207
...
...
@@ -142,6 +142,7 @@ class AfmoeMoE(nn.Module):
e_score_correction_bias
=
self
.
expert_bias
,
enable_eplb
=
self
.
enable_eplb
,
num_redundant_experts
=
self
.
n_redundant_experts
,
router_logits_dtype
=
torch
.
float32
,
)
def
forward
(
self
,
hidden_states
:
torch
.
Tensor
)
->
torch
.
Tensor
:
...
...
vllm/model_executor/models/bailing_moe.py
View file @
eb5ed207
...
...
@@ -300,6 +300,7 @@ class BailingMoE(nn.Module):
num_expert_group
=
self
.
n_group
,
topk_group
=
self
.
topk_group
,
use_grouped_topk
=
self
.
use_grouped_topk
,
router_logits_dtype
=
self
.
router_dtype
,
)
def
forward
(
self
,
hidden_states
:
torch
.
Tensor
)
->
torch
.
Tensor
:
...
...
vllm/model_executor/models/flex_olmo.py
View file @
eb5ed207
...
...
@@ -71,7 +71,6 @@ class FlexOlmoMoE(nn.Module):
prefix
=
f
"
{
prefix
}
.gate"
,
)
# Gate always runs at half / full precision for now.
self
.
experts
=
FusedMoE
(
num_experts
=
hf_config
.
num_experts
,
top_k
=
hf_config
.
num_experts_per_tok
,
...
...
@@ -82,6 +81,7 @@ class FlexOlmoMoE(nn.Module):
quant_config
=
None
,
tp_size
=
tp_size
,
prefix
=
f
"
{
prefix
}
.experts"
,
router_logits_dtype
=
torch
.
float32
,
)
self
.
top_k
=
hf_config
.
num_experts_per_tok
...
...
vllm/model_executor/models/longcat_flash.py
View file @
eb5ed207
...
...
@@ -236,9 +236,9 @@ class FlashMLP(nn.Module):
class
LongcatRouter
(
nn
.
Module
):
def
__init__
(
self
,
config
,
zero_expert_num
=
0
,
rounter_params_dtype
=
torch
.
bfloat16
,
config
:
FlashConfig
,
zero_expert_num
:
int
,
rounter_params_dtype
:
torch
.
dtype
,
prefix
:
str
=
""
,
):
super
().
__init__
()
...
...
@@ -309,6 +309,7 @@ class LongcatMoe(nn.Module):
prefix
=
f
"
{
prefix
}
.experts"
,
enable_eplb
=
enable_eplb
,
routed_scaling_factor
=
config
.
routed_scaling_factor
,
router_logits_dtype
=
self
.
rounter_params_dtype
,
)
def
forward
(
self
,
hidden_states
:
torch
.
Tensor
)
->
torch
.
Tensor
:
...
...
vllm/model_executor/models/mimo_v2_flash.py
View file @
eb5ed207
...
...
@@ -174,6 +174,7 @@ class MiMoV2MoE(nn.Module):
num_expert_group
=
config
.
n_group
,
topk_group
=
config
.
topk_group
,
scoring_func
=
"sigmoid"
,
router_logits_dtype
=
self
.
gate_dtype
,
)
def
forward
(
self
,
hidden_states
:
torch
.
Tensor
)
->
torch
.
Tensor
:
...
...
vllm/model_executor/models/step3p5.py
View file @
eb5ed207
...
...
@@ -388,6 +388,7 @@ class FusedMoEBlock(nn.Module):
routed_scaling_factor
=
config
.
moe_router_scaling_factor
,
enable_eplb
=
self
.
enable_eplb
,
num_redundant_experts
=
self
.
n_redundant_experts
,
router_logits_dtype
=
torch
.
float32
,
)
def
forward
(
self
,
hidden_states
:
torch
.
Tensor
)
->
torch
.
Tensor
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment