Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
be874c02
Unverified
Commit
be874c02
authored
Sep 20, 2025
by
Roger Wang
Committed by
GitHub
Sep 20, 2025
Browse files
[Bugfix] Fix Qwen3-VL-MoE weight loading for EP (#25300)
Signed-off-by:
Roger Wang
<
hey@rogerw.io
>
parent
9607d5eb
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
7 additions
and
5 deletions
+7
-5
vllm/model_executor/models/qwen3_vl_moe.py
vllm/model_executor/models/qwen3_vl_moe.py
+7
-5
No files found.
vllm/model_executor/models/qwen3_vl_moe.py
View file @
be874c02
...
@@ -122,9 +122,10 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
...
@@ -122,9 +122,10 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
def
load_fused_expert_weights
(
self
,
name
:
str
,
params_dict
:
dict
,
def
load_fused_expert_weights
(
self
,
name
:
str
,
params_dict
:
dict
,
loaded_weight
:
torch
.
Tensor
,
shard_id
:
str
,
loaded_weight
:
torch
.
Tensor
,
shard_id
:
str
,
num_experts
:
int
):
num_experts
:
int
)
->
bool
:
param
=
params_dict
[
name
]
param
=
params_dict
[
name
]
weight_loader
=
typing
.
cast
(
Callable
[...,
bool
],
param
.
weight_loader
)
weight_loader
=
typing
.
cast
(
Callable
[...,
bool
],
param
.
weight_loader
)
loaded_local_expert
=
False
for
expert_id
in
range
(
num_experts
):
for
expert_id
in
range
(
num_experts
):
curr_expert_weight
=
loaded_weight
[
expert_id
]
curr_expert_weight
=
loaded_weight
[
expert_id
]
success
=
weight_loader
(
param
,
success
=
weight_loader
(
param
,
...
@@ -133,9 +134,10 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
...
@@ -133,9 +134,10 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
shard_id
,
shard_id
,
expert_id
,
expert_id
,
return_success
=
True
)
return_success
=
True
)
if
not
success
:
if
success
:
return
False
loaded_local_expert
=
True
return
True
return
loaded_local_expert
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]])
->
set
[
str
]:
torch
.
Tensor
]])
->
set
[
str
]:
...
@@ -345,4 +347,4 @@ class Qwen3VLMoeForConditionalGeneration(Qwen3VLForConditionalGeneration):
...
@@ -345,4 +347,4 @@ class Qwen3VLMoeForConditionalGeneration(Qwen3VLForConditionalGeneration):
for
_
in
range
(
self
.
deepstack_num_level
)
for
_
in
range
(
self
.
deepstack_num_level
)
]
if
self
.
use_deepstack
else
None
]
if
self
.
use_deepstack
else
None
self
.
visual_dim
=
config
.
vision_config
.
out_hidden_size
self
.
visual_dim
=
config
.
vision_config
.
out_hidden_size
self
.
multiscale_dim
=
self
.
visual_dim
*
self
.
deepstack_num_level
self
.
multiscale_dim
=
self
.
visual_dim
*
self
.
deepstack_num_level
\ No newline at end of file
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment