Update the SEQ_LEN threshold in the log message (8192 → 8000)

c7c03f73 · zhuwenwen · fa973559 · c7c03f73
Commit c7c03f73 authored Aug 19, 2024 by zhuwenwen
Hide whitespace changes
Inline Side-by-side

Showing with 1 addition and 1 deletion

vllm/attention/backends/rocm_flash_attn.py +1 -1

No files found.
--- a/vllm/attention/backends/rocm_flash_attn.py
+++ b/vllm/attention/backends/rocm_flash_attn.py
@@ -238,7 +238,7 @@ class ROCmFlashAttentionImpl(AttentionImpl):
                from flash_attn import flash_attn_varlen_func  # noqa: F401
                self.attn_func_ck = flash_attn_varlen_func
-                logger.debug("When SEQ_LEN > 8192, Use Triton FA in ROCmBackend, otherwise Use CK FA")
+                logger.debug("When SEQ_LEN > 8000, Use Triton FA in ROCmBackend, otherwise Use CK FA")
            else:
                # from vllm.attention.ops.triton_flash_attention import (  # noqa: F401
                #     triton_attention)