Commit 5973c805 authored by zhuwenwen
Browse files

import concatv3Tritonfinal

parent 379315a0
@@ -216,7 +216,7 @@ from vllm.v1.attention.backends.utils import (AttentionMetadataBuilder,
 CommonAttentionMetadata)
 from vllm.v1.kv_cache_interface import AttentionSpec
 from vllm.v1.worker.block_table import BlockTable
-from concatv3Tritonfinal import concat_helper
+from vllm.v1.attention.backends.mla.concatv3Tritonfinal import concat_helper
 try:
     from vllm.vllm_flash_attn import flash_attn_varlen_func
......
@@ -20,7 +20,7 @@ from vllm.v1.attention.backends.mla.common import (MLACommonBackend,
 from vllm.v1.kv_cache_interface import AttentionSpec
 from vllm.v1.worker.block_table import BlockTable
 from vllm import envs
-from concatv3Tritonfinal import concat_helper
+from vllm.v1.attention.backends.mla.concatv3Tritonfinal import concat_helper
 logger = init_logger(__name__)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment