Unverified Commit 5be4fe5a authored by Kane's avatar Kane Committed by GitHub
Browse files

fix mlu int8 quant (#531)

1. 修复mlu int8量化
parent f7665abb
...@@ -1204,5 +1204,7 @@ class MMWeightWint8channelAint8channeldynamicMlu(MMWeightQuantTemplate): ...@@ -1204,5 +1204,7 @@ class MMWeightWint8channelAint8channeldynamicMlu(MMWeightQuantTemplate):
def apply(self, input_tensor):
    """Apply the quantized linear layer on MLU: int8xint8 scaled matmul.

    The activation is quantized dynamically via ``self.act_quant_func`` and
    multiplied against the pre-quantized int8 weight with ``tmo.scaled_matmul``,
    which de-scales the result back to the activation's original dtype.

    Args:
        input_tensor: activation tensor; presumably shaped (tokens, in_features)
            with a float dtype — TODO confirm against callers.

    Returns:
        Output tensor in ``input_tensor``'s original dtype.
    """
    dtype = input_tensor.dtype
    # Dynamic activation quantization: returns the int8 tensor and its scales.
    input_tensor_quant, input_tensor_scale = self.act_quant_func(input_tensor)
    output_tensor = tmo.scaled_matmul(
        input_tensor_quant,
        self.weight.contiguous(),
        input_tensor_scale,
        self.weight_scale.squeeze(-1),
        # `self.bias if self.bias is not None else None` was a tautology —
        # both branches evaluate to self.bias; pass it through directly.
        bias=self.bias,
        output_dtype=dtype,
        # NOTE(review): use_hp_active presumably enables high-precision
        # activation handling inside the kernel — confirm against tmo docs.
        use_hp_active=True,
    )
    return output_tensor
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment