Unverified Commit 388c05d5 authored by yhyang201's avatar yhyang201 Committed by GitHub
Browse files

Fix bias handling in TritonMoeQuantInfo within quantization/mxfp4.py (#10579)

parent fc809665
......@@ -731,8 +731,8 @@ class Mxfp4MoEMethod(FusedMoEMethodBase):
quant_info = TritonMoeQuantInfo(
w13_weight=layer.w13_weight,
w2_weight=layer.w2_weight,
w13_weight_bias=layer.w13_weight_bias,
w2_weight_bias=layer.w2_weight_bias,
b13=getattr(layer, "w13_weight_bias", None),
b2=getattr(layer, "w2_weight_bias", None),
)
return self.runner.run(dispatch_output, quant_info)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment