Update _custom_ops.py

495606d4 · gaoqiong · 7ef78993 · 495606d4
Commit 495606d4 authored Dec 19, 2024 by gaoqiong
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 3 additions and 2 deletions

vllm/_custom_ops.py vllm/_custom_ops.py +3 -2

No files found.
--- a/vllm/_custom_ops.py
+++ b/vllm/_custom_ops.py
@@ -906,9 +906,10 @@ def triton_scaled_mm(a: torch.Tensor,
                      scale_a: torch.Tensor,
                      scale_b: torch.Tensor,
                      out_dtype: torch.dtype,
-                      bias: Optional[torch.Tensor] = None) -> torch.Tensor:
+                      bias: Optional[torch.Tensor] = None,
+                      best_config:Optional[list] = None) -> torch.Tensor:

-    return quant_ops.triton_scaled_mm(a, b,scale_a,scale_b,out_dtype,bias)
+    return quant_ops.triton_scaled_mm(a, b,scale_a,scale_b,out_dtype,bias,best_config)

 def triton_int8_gemm_helper(m: int,
                             n: int,