Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
2f186635
Unverified
Commit
2f186635
authored
Feb 14, 2026
by
Roger Wang
Committed by
GitHub
Feb 14, 2026
Browse files
[Bugfix] Fix Qwen3.5 config loading (#34554)
Signed-off-by:
Roger Wang
<
hey@rogerw.io
>
parent
342a7cda
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
18 additions
and
10 deletions
+18
-10
vllm/transformers_utils/configs/qwen3_5.py
vllm/transformers_utils/configs/qwen3_5.py
+9
-5
vllm/transformers_utils/configs/qwen3_5_moe.py
vllm/transformers_utils/configs/qwen3_5_moe.py
+9
-5
No files found.
vllm/transformers_utils/configs/qwen3_5.py
View file @
2f186635
...
@@ -72,10 +72,6 @@ class Qwen3_5TextConfig(PretrainedConfig):
...
@@ -72,10 +72,6 @@ class Qwen3_5TextConfig(PretrainedConfig):
"mrope_section"
,
"mrope_section"
,
"mrope_interleaved"
,
"mrope_interleaved"
,
]
]
self
.
pad_token_id
=
pad_token_id
self
.
bos_token_id
=
bos_token_id
self
.
eos_token_id
=
eos_token_id
self
.
tie_word_embeddings
=
tie_word_embeddings
self
.
vocab_size
=
vocab_size
self
.
vocab_size
=
vocab_size
self
.
max_position_embeddings
=
max_position_embeddings
self
.
max_position_embeddings
=
max_position_embeddings
self
.
hidden_size
=
hidden_size
self
.
hidden_size
=
hidden_size
...
@@ -111,6 +107,13 @@ class Qwen3_5TextConfig(PretrainedConfig):
...
@@ -111,6 +107,13 @@ class Qwen3_5TextConfig(PretrainedConfig):
self
.
linear_num_key_heads
=
linear_num_key_heads
self
.
linear_num_key_heads
=
linear_num_key_heads
self
.
linear_num_value_heads
=
linear_num_value_heads
self
.
linear_num_value_heads
=
linear_num_value_heads
super
().
__init__
(
**
kwargs
)
super
().
__init__
(
**
kwargs
)
# Set these AFTER super().__init__() because transformers v4's
# PretrainedConfig.__init__ has these as explicit params with different
# defaults (e.g. tie_word_embeddings=True) that would overwrite our values.
self
.
pad_token_id
=
pad_token_id
self
.
bos_token_id
=
bos_token_id
self
.
eos_token_id
=
eos_token_id
self
.
tie_word_embeddings
=
tie_word_embeddings
class
Qwen3_5VisionConfig
(
PretrainedConfig
):
class
Qwen3_5VisionConfig
(
PretrainedConfig
):
...
@@ -182,8 +185,9 @@ class Qwen3_5Config(PretrainedConfig):
...
@@ -182,8 +185,9 @@ class Qwen3_5Config(PretrainedConfig):
self
.
video_token_id
=
video_token_id
self
.
video_token_id
=
video_token_id
self
.
vision_start_token_id
=
vision_start_token_id
self
.
vision_start_token_id
=
vision_start_token_id
self
.
vision_end_token_id
=
vision_end_token_id
self
.
vision_end_token_id
=
vision_end_token_id
self
.
tie_word_embeddings
=
tie_word_embeddings
super
().
__init__
(
**
kwargs
)
super
().
__init__
(
**
kwargs
)
# Set after super().__init__() to avoid v4 PretrainedConfig overwrite
self
.
tie_word_embeddings
=
tie_word_embeddings
__all__
=
[
"Qwen3_5Config"
,
"Qwen3_5TextConfig"
]
__all__
=
[
"Qwen3_5Config"
,
"Qwen3_5TextConfig"
]
vllm/transformers_utils/configs/qwen3_5_moe.py
View file @
2f186635
...
@@ -79,10 +79,6 @@ class Qwen3_5MoeTextConfig(PretrainedConfig):
...
@@ -79,10 +79,6 @@ class Qwen3_5MoeTextConfig(PretrainedConfig):
"mrope_section"
,
"mrope_section"
,
"mrope_interleaved"
,
"mrope_interleaved"
,
]
]
self
.
pad_token_id
=
pad_token_id
self
.
bos_token_id
=
bos_token_id
self
.
eos_token_id
=
eos_token_id
self
.
tie_word_embeddings
=
tie_word_embeddings
self
.
vocab_size
=
vocab_size
self
.
vocab_size
=
vocab_size
self
.
max_position_embeddings
=
max_position_embeddings
self
.
max_position_embeddings
=
max_position_embeddings
self
.
hidden_size
=
hidden_size
self
.
hidden_size
=
hidden_size
...
@@ -123,6 +119,13 @@ class Qwen3_5MoeTextConfig(PretrainedConfig):
...
@@ -123,6 +119,13 @@ class Qwen3_5MoeTextConfig(PretrainedConfig):
self
.
output_router_logits
=
output_router_logits
self
.
output_router_logits
=
output_router_logits
self
.
router_aux_loss_coef
=
router_aux_loss_coef
self
.
router_aux_loss_coef
=
router_aux_loss_coef
super
().
__init__
(
**
kwargs
)
super
().
__init__
(
**
kwargs
)
# Set these AFTER super().__init__() because transformers v4's
# PretrainedConfig.__init__ has these as explicit params with different
# defaults (e.g. tie_word_embeddings=True) that would overwrite our values.
self
.
pad_token_id
=
pad_token_id
self
.
bos_token_id
=
bos_token_id
self
.
eos_token_id
=
eos_token_id
self
.
tie_word_embeddings
=
tie_word_embeddings
class
Qwen3_5MoeVisionConfig
(
PretrainedConfig
):
class
Qwen3_5MoeVisionConfig
(
PretrainedConfig
):
...
@@ -194,8 +197,9 @@ class Qwen3_5MoeConfig(PretrainedConfig):
...
@@ -194,8 +197,9 @@ class Qwen3_5MoeConfig(PretrainedConfig):
self
.
video_token_id
=
video_token_id
self
.
video_token_id
=
video_token_id
self
.
vision_start_token_id
=
vision_start_token_id
self
.
vision_start_token_id
=
vision_start_token_id
self
.
vision_end_token_id
=
vision_end_token_id
self
.
vision_end_token_id
=
vision_end_token_id
self
.
tie_word_embeddings
=
tie_word_embeddings
super
().
__init__
(
**
kwargs
)
super
().
__init__
(
**
kwargs
)
# Set after super().__init__() to avoid v4 PretrainedConfig overwrite
self
.
tie_word_embeddings
=
tie_word_embeddings
__all__
=
[
"Qwen3_5MoeConfig"
,
"Qwen3_5MoeTextConfig"
]
__all__
=
[
"Qwen3_5MoeConfig"
,
"Qwen3_5MoeTextConfig"
]
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment