Unverified commit 6409004b, authored by vllmellm and committed by GitHub
Browse files

[ROCm][AITER] bugfix accuracy regression in ROCM_AITER_TRITON_MLA backend (#31816)


Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
parent aafd4d23
# SPDX-License-Identifier: Apache-2.0 # SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project # SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from vllm.v1.attention.backends.mla.common import MLACommonBackend from vllm.v1.attention.backends.mla.rocm_aiter_mla import AiterMLABackend, AiterMLAImpl
from vllm.v1.attention.backends.mla.rocm_aiter_mla import (
AiterMLAImpl,
AiterMLAMetadataBuilder,
)
class AiterTritonMLABackend(MLACommonBackend): class AiterTritonMLABackend(AiterMLABackend):
@staticmethod @staticmethod
def get_name() -> str: def get_name() -> str:
return "AITER_TRITON_MLA" return "AITER_TRITON_MLA"
...@@ -16,10 +12,6 @@ class AiterTritonMLABackend(MLACommonBackend): ...@@ -16,10 +12,6 @@ class AiterTritonMLABackend(MLACommonBackend):
def get_impl_cls() -> type["AiterTritonMLAImpl"]: def get_impl_cls() -> type["AiterTritonMLAImpl"]:
return AiterTritonMLAImpl return AiterTritonMLAImpl
@staticmethod
def get_builder_cls() -> type["AiterMLAMetadataBuilder"]:
return AiterMLAMetadataBuilder
class AiterTritonMLAImpl(AiterMLAImpl): class AiterTritonMLAImpl(AiterMLAImpl):
def __init__( def __init__(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment