Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
160c6fa3
Unverified
Commit
160c6fa3
authored
Jan 23, 2026
by
Nicolò Lucchesi
Committed by
GitHub
Jan 23, 2026
Browse files
[Misc] Add `get_name` to missing AttentionBackends (#32698)
Signed-off-by:
NickLucche
<
nlucches@redhat.com
>
parent
a8eb1182
Changes
6
Hide whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
28 additions
and
1 deletion
+28
-1
vllm/v1/attention/backends/gdn_attn.py
vllm/v1/attention/backends/gdn_attn.py
+4
-0
vllm/v1/attention/backends/linear_attn.py
vllm/v1/attention/backends/linear_attn.py
+4
-0
vllm/v1/attention/backends/mamba1_attn.py
vllm/v1/attention/backends/mamba1_attn.py
+4
-0
vllm/v1/attention/backends/mamba2_attn.py
vllm/v1/attention/backends/mamba2_attn.py
+8
-1
vllm/v1/attention/backends/mla/indexer.py
vllm/v1/attention/backends/mla/indexer.py
+4
-0
vllm/v1/attention/backends/short_conv_attn.py
vllm/v1/attention/backends/short_conv_attn.py
+4
-0
No files found.
vllm/v1/attention/backends/gdn_attn.py
View file @
160c6fa3
...
@@ -22,6 +22,10 @@ from vllm.v1.kv_cache_interface import AttentionSpec, MambaSpec
...
@@ -22,6 +22,10 @@ from vllm.v1.kv_cache_interface import AttentionSpec, MambaSpec
class
GDNAttentionBackend
(
AttentionBackend
):
class
GDNAttentionBackend
(
AttentionBackend
):
@
staticmethod
def
get_name
()
->
str
:
return
"GDN_ATTN"
@
staticmethod
@
staticmethod
def
get_builder_cls
()
->
type
[
"GDNAttentionMetadataBuilder"
]:
def
get_builder_cls
()
->
type
[
"GDNAttentionMetadataBuilder"
]:
return
GDNAttentionMetadataBuilder
return
GDNAttentionMetadataBuilder
...
...
vllm/v1/attention/backends/linear_attn.py
View file @
160c6fa3
...
@@ -16,6 +16,10 @@ from vllm.v1.kv_cache_interface import AttentionSpec, MambaSpec
...
@@ -16,6 +16,10 @@ from vllm.v1.kv_cache_interface import AttentionSpec, MambaSpec
class
LinearAttentionBackend
(
AttentionBackend
):
class
LinearAttentionBackend
(
AttentionBackend
):
@
staticmethod
def
get_name
()
->
str
:
return
"LINEAR_ATTN"
@
staticmethod
@
staticmethod
def
get_builder_cls
()
->
type
[
"LinearAttentionMetadataBuilder"
]:
def
get_builder_cls
()
->
type
[
"LinearAttentionMetadataBuilder"
]:
return
LinearAttentionMetadataBuilder
return
LinearAttentionMetadataBuilder
...
...
vllm/v1/attention/backends/mamba1_attn.py
View file @
160c6fa3
...
@@ -11,6 +11,10 @@ from vllm.v1.attention.backends.mamba_attn import (
...
@@ -11,6 +11,10 @@ from vllm.v1.attention.backends.mamba_attn import (
class
Mamba1AttentionBackend
(
AttentionBackend
):
class
Mamba1AttentionBackend
(
AttentionBackend
):
@
staticmethod
def
get_name
()
->
str
:
return
"MAMBA1_ATTN"
@
staticmethod
@
staticmethod
def
get_builder_cls
()
->
type
[
"Mamba1AttentionMetadataBuilder"
]:
def
get_builder_cls
()
->
type
[
"Mamba1AttentionMetadataBuilder"
]:
return
Mamba1AttentionMetadataBuilder
return
Mamba1AttentionMetadataBuilder
...
...
vllm/v1/attention/backends/mamba2_attn.py
View file @
160c6fa3
...
@@ -7,7 +7,10 @@ import torch
...
@@ -7,7 +7,10 @@ import torch
from
vllm.config
import
VllmConfig
from
vllm.config
import
VllmConfig
from
vllm.utils.math_utils
import
cdiv
from
vllm.utils.math_utils
import
cdiv
from
vllm.v1.attention.backend
import
AttentionBackend
,
CommonAttentionMetadata
from
vllm.v1.attention.backend
import
(
AttentionBackend
,
CommonAttentionMetadata
,
)
from
vllm.v1.attention.backends.mamba_attn
import
(
from
vllm.v1.attention.backends.mamba_attn
import
(
BaseMambaAttentionMetadata
,
BaseMambaAttentionMetadata
,
BaseMambaAttentionMetadataBuilder
,
BaseMambaAttentionMetadataBuilder
,
...
@@ -85,6 +88,10 @@ def compute_varlen_chunk_metadata(
...
@@ -85,6 +88,10 @@ def compute_varlen_chunk_metadata(
class
Mamba2AttentionBackend
(
AttentionBackend
):
class
Mamba2AttentionBackend
(
AttentionBackend
):
@
staticmethod
def
get_name
()
->
str
:
return
"MAMBA2_ATTN"
@
staticmethod
@
staticmethod
def
get_builder_cls
()
->
type
[
"Mamba2AttentionMetadataBuilder"
]:
def
get_builder_cls
()
->
type
[
"Mamba2AttentionMetadataBuilder"
]:
return
Mamba2AttentionMetadataBuilder
return
Mamba2AttentionMetadataBuilder
...
...
vllm/v1/attention/backends/mla/indexer.py
View file @
160c6fa3
...
@@ -25,6 +25,10 @@ logger = init_logger(__name__)
...
@@ -25,6 +25,10 @@ logger = init_logger(__name__)
class
DeepseekV32IndexerBackend
(
AttentionBackend
):
class
DeepseekV32IndexerBackend
(
AttentionBackend
):
@
staticmethod
def
get_name
()
->
str
:
return
"DEEPSEEK_V32_INDEXER"
@
staticmethod
@
staticmethod
def
get_supported_kernel_block_sizes
()
->
list
[
int
|
MultipleOf
]:
def
get_supported_kernel_block_sizes
()
->
list
[
int
|
MultipleOf
]:
return
[
1
if
current_platform
.
is_rocm
()
else
64
]
return
[
1
if
current_platform
.
is_rocm
()
else
64
]
...
...
vllm/v1/attention/backends/short_conv_attn.py
View file @
160c6fa3
...
@@ -10,6 +10,10 @@ from vllm.v1.attention.backends.mamba_attn import (
...
@@ -10,6 +10,10 @@ from vllm.v1.attention.backends.mamba_attn import (
class
ShortConvAttentionBackend
(
AttentionBackend
):
class
ShortConvAttentionBackend
(
AttentionBackend
):
@
staticmethod
def
get_name
()
->
str
:
return
"SHORT_CONV_ATTN"
@
staticmethod
@
staticmethod
def
get_builder_cls
()
->
type
[
"ShortConvAttentionMetadataBuilder"
]:
def
get_builder_cls
()
->
type
[
"ShortConvAttentionMetadataBuilder"
]:
return
ShortConvAttentionMetadataBuilder
return
ShortConvAttentionMetadataBuilder
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment