[Misc] Fix docstring of get_attn_backend (#5271)

c65146e7 · Woosuk Kwon · GitHub · 41ca62cf · c65146e7
Unverified commit c65146e7, authored Jun 05, 2024 by Woosuk Kwon; committed by GitHub on Jun 05, 2024.
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 3 deletions

vllm/attention/selector.py vllm/attention/selector.py +2 -3

No files found.
--- a/vllm/attention/selector.py
+++ b/vllm/attention/selector.py
@@ -31,15 +31,14 @@ def get_attn_backend(
    block_size: int,
    is_blocksparse: bool = False,
 ) -> Type[AttentionBackend]:
+    """Selects which attention backend to use and lazily imports it."""
    if is_blocksparse:
        logger.info("Using BlocksparseFlashAttention backend.")
        from vllm.attention.backends.blocksparse_attn import (
            BlocksparseFlashAttentionBackend)
        return BlocksparseFlashAttentionBackend
-    """Determine which attention backend to use and only import
-    the selected backend module.
-    """
    backend = which_attn_to_use(num_heads, head_size, num_kv_heads,
                                sliding_window, dtype, kv_cache_dtype,
                                block_size)