gaoqiong / flash-attention / Commits / 204c3c6d

Unverified commit 204c3c6d, authored Jan 24, 2024 by Tao He, committed by GitHub Jan 23, 2024

Fixes an error in comment (#785)

Signed-off-by: Tao He <sighingnow@gmail.com>

parent 197f2083
Changes: 2 changed files, with 2 additions and 2 deletions (+2 -2)

README.md                           +1 -1
flash_attn/flash_attn_interface.py  +1 -1
README.md (view file @ 204c3c6d)

@@ -212,7 +212,7 @@ def flash_attn_with_kvcache(
     rotary_sin [optional]: (seqlen_ro, rotary_dim / 2). Similar to rotary_cos.
     cache_seqlens: int, or (batch_size,), dtype torch.int32. The sequence lengths of the
         KV cache.
-    block_table [optional]: (num_blocks, max_num_blocks_per_seq), dtype torch.int32.
+    block_table [optional]: (batch_size, max_num_blocks_per_seq), dtype torch.int32.
     cache_batch_idx: (batch_size,), dtype torch.int32. The indices used to index into the KV cache.
         If None, we assume that the batch indices are [0, 1, 2, ..., batch_size - 1].
         If the indices are not distinct, and k and v are provided, the values updated in the cache
flash_attn/flash_attn_interface.py (view file @ 204c3c6d)

@@ -1149,7 +1149,7 @@ def flash_attn_with_kvcache(
     rotary_sin [optional]: (seqlen_ro, rotary_dim / 2). Similar to rotary_cos.
     cache_seqlens: int, or (batch_size,), dtype torch.int32. The sequence lengths of the
         KV cache.
-    block_table [optional]: (num_blocks, max_num_blocks_per_seq), dtype torch.int32.
+    block_table [optional]: (batch_size, max_num_blocks_per_seq), dtype torch.int32.
     cache_batch_idx: (batch_size,), dtype torch.int32. The indices used to index into the KV cache.
         If None, we assume that the batch indices are [0, 1, 2, ..., batch_size - 1].
         If the indices are not distinct, and k and v are provided, the values updated in the cache
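To make the corrected docstring concrete: block_table holds one row of page indices per sequence in the batch, which is why its leading dimension is batch_size, while num_blocks counts pages in the global cache pool. Below is a minimal sketch of a paged-KV-cache decode call, assuming the flash-attn 2.x Python API (flash_attn_with_kvcache with q, k_cache, v_cache, cache_seqlens, block_table, causal arguments and a per-block cache layout of (num_blocks, page_block_size, nheads_k, headdim)); these details are not part of this commit and should be checked against the installed version.

    # Hypothetical paged-KV-cache decode step; shapes follow the fixed docstring.
    import torch
    from flash_attn import flash_attn_with_kvcache

    batch_size, seqlen_q = 2, 1              # decode: one new query token per sequence
    nheads, nheads_k, headdim = 8, 8, 64
    page_block_size = 256                    # page size; version-dependent constraints may apply
    max_num_blocks_per_seq = 4
    num_blocks = batch_size * max_num_blocks_per_seq   # total pages in the pool

    device, dtype = "cuda", torch.float16
    q = torch.randn(batch_size, seqlen_q, nheads, headdim, device=device, dtype=dtype)
    # Paged caches are laid out per block: (num_blocks, page_block_size, nheads_k, headdim).
    k_cache = torch.randn(num_blocks, page_block_size, nheads_k, headdim, device=device, dtype=dtype)
    v_cache = torch.randn_like(k_cache)

    # One row of page indices per sequence: (batch_size, max_num_blocks_per_seq).
    block_table = torch.arange(num_blocks, device=device, dtype=torch.int32).reshape(
        batch_size, max_num_blocks_per_seq
    )
    # Tokens already present in the cache for each sequence: (batch_size,).
    cache_seqlens = torch.full((batch_size,), 300, device=device, dtype=torch.int32)

    out = flash_attn_with_kvcache(
        q, k_cache, v_cache,
        cache_seqlens=cache_seqlens,
        block_table=block_table,
        causal=True,
    )
    print(out.shape)  # (batch_size, seqlen_q, nheads, headdim)

The sketch only illustrates why (batch_size, max_num_blocks_per_seq) is the right shape for block_table: each batch element needs its own list of up to max_num_blocks_per_seq pages, regardless of how many pages the pool (num_blocks) contains.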