Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
a258ad8b
Unverified
Commit
a258ad8b
authored
Aug 17, 2025
by
Jinzhen Lin
Committed by
GitHub
Aug 16, 2025
Browse files
[Bugfix] fix qwen3 moe fp8 accuracy issue (#23031)
Signed-off-by:
Jinzhen Lin
<
jinzhen.ljz@antgroup.com
>
parent
bf7f470b
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
0 deletions
+4
-0
vllm/model_executor/layers/quantization/fp8.py
vllm/model_executor/layers/quantization/fp8.py
+4
-0
No files found.
vllm/model_executor/layers/quantization/fp8.py
View file @
a258ad8b
...
...
@@ -125,6 +125,10 @@ class Fp8Config(QuantizationConfig):
ignored_layers
=
cls
.
get_from_keys_or
(
config
,
[
"ignored_layers"
],
None
)
weight_block_size
=
cls
.
get_from_keys_or
(
config
,
[
"weight_block_size"
],
None
)
if
not
ignored_layers
:
ignored_layers
=
cls
.
get_from_keys_or
(
config
,
[
"modules_to_not_convert"
],
None
)
return
cls
(
is_checkpoint_fp8_serialized
=
is_checkpoint_fp8_serialized
,
activation_scheme
=
activation_scheme
,
ignored_layers
=
ignored_layers
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment