Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
ebd0a17e
Unverified
Commit
ebd0a17e
authored
Jan 23, 2026
by
joninco
Committed by
GitHub
Jan 23, 2026
Browse files
[Bugfix] Fix missing is_layer_skipped check for FusedMoE in AWQConfig (#32935)
Signed-off-by:
jon
<
joninco@bullpoint.org
>
parent
37c9859f
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
3 additions
and
2 deletions
+3
-2
vllm/model_executor/layers/quantization/awq.py
vllm/model_executor/layers/quantization/awq.py
+3
-2
No files found.
vllm/model_executor/layers/quantization/awq.py
View file @
ebd0a17e
...
@@ -106,7 +106,7 @@ class AWQConfig(QuantizationConfig):
...
@@ -106,7 +106,7 @@ class AWQConfig(QuantizationConfig):
return
AWQLinearMethod
(
self
)
return
AWQLinearMethod
(
self
)
elif
isinstance
(
layer
,
FusedMoE
):
elif
isinstance
(
layer
,
FusedMoE
):
# Lazy import to avoid circular import.
# Lazy import to avoid circular import.
from
.awq_marlin
import
AWQMarlinConfig
,
AWQMarlinMoEMethod
from
.awq_marlin
import
AWQMarlinConfig
from
.moe_wna16
import
MoeWNA16Config
from
.moe_wna16
import
MoeWNA16Config
from
.utils.marlin_utils
import
check_moe_marlin_supports_layer
from
.utils.marlin_utils
import
check_moe_marlin_supports_layer
...
@@ -121,6 +121,7 @@ class AWQConfig(QuantizationConfig):
...
@@ -121,6 +121,7 @@ class AWQConfig(QuantizationConfig):
"group_size"
:
self
.
group_size
,
"group_size"
:
self
.
group_size
,
"zero_point"
:
self
.
zero_point
,
"zero_point"
:
self
.
zero_point
,
"lm_head"
:
False
,
"lm_head"
:
False
,
"modules_to_not_convert"
:
self
.
modules_to_not_convert
,
}
}
return
MoeWNA16Config
.
from_config
(
config
).
get_quant_method
(
return
MoeWNA16Config
.
from_config
(
config
).
get_quant_method
(
layer
,
prefix
layer
,
prefix
...
@@ -136,7 +137,7 @@ class AWQConfig(QuantizationConfig):
...
@@ -136,7 +137,7 @@ class AWQConfig(QuantizationConfig):
awq_marlin_config
=
AWQMarlinConfig
.
from_config
(
awq_marlin_config
=
AWQMarlinConfig
.
from_config
(
marlin_compatible_config_dict
marlin_compatible_config_dict
)
)
return
AWQMarlinMoEMethod
(
awq_marlin_config
,
layer
.
moe_config
)
return
awq_marlin_config
.
get_quant_method
(
layer
,
prefix
)
return
None
return
None
def
apply_vllm_mapper
(
self
,
hf_to_vllm_mapper
:
"WeightsMapper"
):
def
apply_vllm_mapper
(
self
,
hf_to_vllm_mapper
:
"WeightsMapper"
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment