"src/vscode:/vscode.git/clone" did not exist on "358bd2a0104d3b06a39433042df9578bdbcf944c"
Unverified commit f0f13701, authored by gushiqiao, committed by GitHub
Browse files
parent efe5d2be
......@@ -597,7 +597,7 @@ class MMWeightWfp8channelAfp8channeldynamicVllm(MMWeightQuantTemplate):
self.weight,
input_tensor_scale,
self.weight_scale,
self.bias,
self.bias if self.bias is not None else None,
)
return output_tensor
......@@ -632,7 +632,7 @@ class MMWeightWint8channelAint8channeldynamicVllm(MMWeightQuantTemplate):
self.weight,
input_tensor_scale,
self.weight_scale,
self.bias,
self.bias if self.bias is not None else None,
)
return output_tensor
......@@ -823,7 +823,7 @@ class MMWeightWfp8channelAfp8channeldynamicQ8F(MMWeightQuantTemplate):
output_tensor = Q8F.linear.fp8_linear(
input_tensor_quant,
self.weight,
self.bias.float(),
self.bias.float() if self.bias is not None else None,
input_tensor_scale,
self.weight_scale,
out_dtype=self.infer_dtype,
......@@ -853,7 +853,7 @@ class MMWeightWint8channelAint8channeldynamicQ8F(MMWeightQuantTemplate):
output_tensor = Q8F.linear.q8_linear(
input_tensor_quant,
self.weight,
self.bias.float(),
self.bias.float() if self.bias is not None else None,
input_tensor_scale,
self.weight_scale,
fuse_gelu=False,
......@@ -956,7 +956,7 @@ class MMWeightWint8channelAint8channeldynamicSglActVllm(MMWeightQuantTemplate):
input_tensor_scale,
self.weight_scale,
self.infer_dtype,
self.bias,
self.bias if self.bias is not None else None,
)
return output_tensor
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment