Unverified commit ba09652d, authored by JartX, committed by GitHub
Browse files

[ROCM] Enable CompressedTensorsWNA16 (#27187)


Signed-off-by: JartX <sagformas@epdcenter.es>
parent bd66b852
......@@ -142,7 +142,10 @@ class CompressedTensorsMoEMethod(FusedMoEMethodBase):
# group_size=None means channelwise
group_size = weight_quant.group_size or -1
# Prefer to use the MarlinMoE kernel when it is supported.
if not check_moe_marlin_supports_layer(layer, group_size):
if (
not check_moe_marlin_supports_layer(layer, group_size)
or current_platform.is_rocm()
):
if (
weight_quant.strategy == QuantizationStrategy.GROUP
and weight_quant.actorder
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment