Unverified commit 357d435c, authored by Wentao Ye, committed by GitHub
Browse files
parent 108a2728
...@@ -930,8 +930,8 @@ class FlashMLASparseImpl(MLACommonBaseImpl[FlashMLASparseMetadata]): ...@@ -930,8 +930,8 @@ class FlashMLASparseImpl(MLACommonBaseImpl[FlashMLASparseMetadata]):
if self.num_heads % self.padding != 0: if self.num_heads % self.padding != 0:
assert self.padding % self.num_heads == 0 assert self.padding % self.num_heads == 0
logger.warning_once( logger.warning_once(
f"padding num_heads to {self.padding} \ f"padding num_heads to {self.padding} due to sparse attn "
due to sparse attn kernel requirement" "kernel requirement"
) )
q_padded = q.new_empty((q.shape[0], self.padding, q.shape[2])) q_padded = q.new_empty((q.shape[0], self.padding, q.shape[2]))
q_padded[:, : self.num_heads, :] = q q_padded[:, : self.num_heads, :] = q
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment