"vscode:/vscode.git/clone" did not exist on "e97f802b2d74861af77997691a7d1c36498f6dca"
Unverified commit a5ccc85c, authored by Samu Tamminen, committed by GitHub
Browse files

[Bugfix] Fix Dynamo unexpected keyword argument (#34320)


Signed-off-by: Samu Tamminen <stammine@amd.com>
Co-authored-by: Wentao Ye <44945378+yewentao256@users.noreply.github.com>
parent b5475d05
...@@ -85,7 +85,7 @@ class QuantFP8(CustomOp): ...@@ -85,7 +85,7 @@ class QuantFP8(CustomOp):
x: torch.Tensor, x: torch.Tensor,
scale: torch.Tensor | None = None, scale: torch.Tensor | None = None,
scale_ub: torch.Tensor | None = None, scale_ub: torch.Tensor | None = None,
**kwargs, use_triton: bool = False,
) -> tuple[torch.Tensor, torch.Tensor]: ) -> tuple[torch.Tensor, torch.Tensor]:
from vllm.model_executor.layers.quantization.utils import fp8_utils from vllm.model_executor.layers.quantization.utils import fp8_utils
...@@ -135,9 +135,8 @@ class QuantFP8(CustomOp): ...@@ -135,9 +135,8 @@ class QuantFP8(CustomOp):
x: torch.Tensor, x: torch.Tensor,
scale: torch.Tensor | None = None, scale: torch.Tensor | None = None,
scale_ub: torch.Tensor | None = None, scale_ub: torch.Tensor | None = None,
**kwargs, use_triton: bool = False,
) -> tuple[torch.Tensor, torch.Tensor]: ) -> tuple[torch.Tensor, torch.Tensor]:
use_triton = kwargs.get("use_triton", False)
if self.is_group_quant and use_triton: if self.is_group_quant and use_triton:
assert scale is None, "Dynamic group quantization does not use scale" assert scale is None, "Dynamic group quantization does not use scale"
...@@ -171,6 +170,7 @@ class QuantFP8(CustomOp): ...@@ -171,6 +170,7 @@ class QuantFP8(CustomOp):
x: torch.Tensor, x: torch.Tensor,
scale: torch.Tensor | None = None, scale: torch.Tensor | None = None,
scale_ub: torch.Tensor | None = None, scale_ub: torch.Tensor | None = None,
use_triton: bool = False,
): ):
if self.is_group_quant and not self.static: if self.is_group_quant and not self.static:
assert scale is None, "Dynamic group quantization does not use scale" assert scale is None, "Dynamic group quantization does not use scale"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment