Commit 35396f41 authored by zhuwenwen's avatar zhuwenwen
Browse files

skip rocm_aiter_mla

parent ebdb56e1
......@@ -178,13 +178,14 @@ class RocmPlatform(Platform):
kv_cache_dtype, block_size, use_v1,
use_mla) -> str:
if use_mla:
from vllm.attention.backends.rocm_aiter_mla import (
is_aiter_mla_enabled)
# from vllm.attention.backends.rocm_aiter_mla import (
# is_aiter_mla_enabled)
if selected_backend is None:
selected_backend = (_Backend.ROCM_AITER_MLA if
is_aiter_mla_enabled() or block_size == 1
else _Backend.TRITON_MLA)
# selected_backend = (_Backend.ROCM_AITER_MLA if
# is_aiter_mla_enabled() or block_size == 1
# else _Backend.TRITON_MLA)
selected_backend = _Backend.TRITON_MLA
if selected_backend == _Backend.TRITON_MLA:
if block_size != 1:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment