"tests/kernels/attention/test_cache.py" did not exist on "14dbd5a7674e5de2862c18adb711d9feecd35063"
Unverified commit 357d435c, authored by Wentao Ye, committed by GitHub
Browse files
parent 108a2728
......@@ -930,8 +930,8 @@ class FlashMLASparseImpl(MLACommonBaseImpl[FlashMLASparseMetadata]):
if self.num_heads % self.padding != 0:
assert self.padding % self.num_heads == 0
logger.warning_once(
-f"padding num_heads to {self.padding} \
-due to sparse attn kernel requirement"
+f"padding num_heads to {self.padding} due to sparse attn "
+"kernel requirement"
)
q_padded = q.new_empty((q.shape[0], self.padding, q.shape[2]))
q_padded[:, : self.num_heads, :] = q
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment