Unverified commit 54aecd9e, authored by Harry Mellor and committed by GitHub
Browse files

Fix pre-commit (and XPU) on `main` (#28556)


Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
parent 10138c92
...@@ -1145,7 +1145,7 @@ class IpexMxfp4MoEMethod(Mxfp4MoEMethod): ...@@ -1145,7 +1145,7 @@ class IpexMxfp4MoEMethod(Mxfp4MoEMethod):
) -> torch.Tensor: ) -> torch.Tensor:
assert activation == "swigluoai", ( assert activation == "swigluoai", (
"Only swiglu_oai activation is supported for IPEX MXFP4 MoE" "Only swiglu_oai activation is supported for IPEX MXFP4 MoE"
) # noqa: )
hidden_size_pad = round_up(self.original_hidden_size, 128) hidden_size_pad = round_up(self.original_hidden_size, 128)
x_pad = torch.nn.functional.pad(x, (0, hidden_size_pad - x.size(-1))) x_pad = torch.nn.functional.pad(x, (0, hidden_size_pad - x.size(-1)))
hidden_states = layer.ipex_fusion( hidden_states = layer.ipex_fusion(
......
...@@ -64,8 +64,6 @@ class XPUPlatform(Platform): ...@@ -64,8 +64,6 @@ class XPUPlatform(Platform):
if use_sparse: if use_sparse:
raise NotImplementedError("Sparse Attention is not supported on XPU.") raise NotImplementedError("Sparse Attention is not supported on XPU.")
if not use_v1:
raise ValueError("XPU backend only supports V1.")
if selected_backend == AttentionBackendEnum.TRITON_ATTN: if selected_backend == AttentionBackendEnum.TRITON_ATTN:
logger.info_once("Using Triton backend.") logger.info_once("Using Triton backend.")
return AttentionBackendEnum.TRITON_ATTN.get_path() return AttentionBackendEnum.TRITON_ATTN.get_path()
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment