Commit 49be5e62 authored by zhuwenwen
Browse files

update rocm_flash_attn.py

parent db561fb6
...@@ -189,7 +189,7 @@ class ROCmFlashAttentionMetadata(AttentionMetadata, PagedAttentionMetadata): ...@@ -189,7 +189,7 @@ class ROCmFlashAttentionMetadata(AttentionMetadata, PagedAttentionMetadata):
encoder_seq_lens_tensor=self.encoder_seq_lens_tensor, encoder_seq_lens_tensor=self.encoder_seq_lens_tensor,
max_encoder_seq_len=self.max_encoder_seq_len, max_encoder_seq_len=self.max_encoder_seq_len,
cross_slot_mapping=self.cross_slot_mapping, cross_slot_mapping=self.cross_slot_mapping,
cross_block_tables=self.cross_block_tables cross_block_tables=self.cross_block_tables,
tree_attention_masks_tensor=self.tree_attention_masks_tensor, tree_attention_masks_tensor=self.tree_attention_masks_tensor,
block_tables_list=self.block_tables_list) block_tables_list=self.block_tables_list)
return self._cached_prefill_metadata return self._cached_prefill_metadata
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment