Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
430dd4d9
Unverified
Commit
430dd4d9
authored
Nov 26, 2025
by
Matthew Bonanni
Committed by
GitHub
Nov 26, 2025
Browse files
[Attention] Remove imports from `vllm/attention/__init__.py` (#29342)
Signed-off-by:
Matthew Bonanni
<
mbonanni@redhat.com
>
parent
c4c0354e
Changes
96
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
26 additions
and
20 deletions
+26
-20
vllm/model_executor/models/mpt.py
vllm/model_executor/models/mpt.py
+1
-1
vllm/model_executor/models/nemotron.py
vllm/model_executor/models/nemotron.py
+1
-1
vllm/model_executor/models/nemotron_nas.py
vllm/model_executor/models/nemotron_nas.py
+1
-1
vllm/model_executor/models/olmo.py
vllm/model_executor/models/olmo.py
+1
-1
vllm/model_executor/models/olmo2.py
vllm/model_executor/models/olmo2.py
+1
-1
vllm/model_executor/models/olmoe.py
vllm/model_executor/models/olmoe.py
+1
-1
vllm/model_executor/models/openpangu.py
vllm/model_executor/models/openpangu.py
+2
-1
vllm/model_executor/models/opt.py
vllm/model_executor/models/opt.py
+1
-1
vllm/model_executor/models/orion.py
vllm/model_executor/models/orion.py
+1
-1
vllm/model_executor/models/ouro.py
vllm/model_executor/models/ouro.py
+2
-1
vllm/model_executor/models/persimmon.py
vllm/model_executor/models/persimmon.py
+1
-1
vllm/model_executor/models/phi.py
vllm/model_executor/models/phi.py
+1
-1
vllm/model_executor/models/phimoe.py
vllm/model_executor/models/phimoe.py
+1
-1
vllm/model_executor/models/qwen.py
vllm/model_executor/models/qwen.py
+1
-1
vllm/model_executor/models/qwen2.py
vllm/model_executor/models/qwen2.py
+2
-1
vllm/model_executor/models/qwen2_moe.py
vllm/model_executor/models/qwen2_moe.py
+1
-1
vllm/model_executor/models/qwen3.py
vllm/model_executor/models/qwen3.py
+2
-1
vllm/model_executor/models/qwen3_moe.py
vllm/model_executor/models/qwen3_moe.py
+1
-1
vllm/model_executor/models/qwen3_next.py
vllm/model_executor/models/qwen3_next.py
+2
-1
vllm/model_executor/models/seed_oss.py
vllm/model_executor/models/seed_oss.py
+2
-1
No files found.
vllm/model_executor/models/mpt.py
View file @
430dd4d9
...
...
@@ -10,7 +10,7 @@ import torch
import
torch.nn
as
nn
from
transformers
import
MptConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/nemotron.py
View file @
430dd4d9
...
...
@@ -30,7 +30,7 @@ from itertools import islice
import
torch
from
torch
import
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/nemotron_nas.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
from
torch
import
nn
from
transformers
import
LlamaConfig
from
vllm.attention
import
AttentionType
from
vllm.attention
.backends.abstract
import
AttentionType
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
...
...
vllm/model_executor/models/olmo.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
from
torch
import
nn
from
transformers
import
OlmoConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/olmo2.py
View file @
430dd4d9
...
...
@@ -32,7 +32,7 @@ import torch
from
torch
import
nn
from
transformers
import
Olmo2Config
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/olmoe.py
View file @
430dd4d9
...
...
@@ -21,7 +21,7 @@ from itertools import islice
import
torch
from
torch
import
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/openpangu.py
View file @
430dd4d9
...
...
@@ -29,7 +29,8 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ParallelConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/opt.py
View file @
430dd4d9
...
...
@@ -27,7 +27,7 @@ import torch
from
torch
import
nn
from
transformers
import
OPTConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/orion.py
View file @
430dd4d9
...
...
@@ -15,7 +15,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/ouro.py
View file @
430dd4d9
...
...
@@ -33,7 +33,8 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/persimmon.py
View file @
430dd4d9
...
...
@@ -30,7 +30,7 @@ import torch
from
torch
import
nn
from
transformers
import
PersimmonConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/phi.py
View file @
430dd4d9
...
...
@@ -45,7 +45,7 @@ import torch
from
torch
import
nn
from
transformers
import
PhiConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/phimoe.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
from
torch
import
nn
from
transformers.configuration_utils
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/qwen.py
View file @
430dd4d9
...
...
@@ -16,7 +16,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/qwen2.py
View file @
430dd4d9
...
...
@@ -33,7 +33,8 @@ import torch
from
torch
import
nn
from
transformers
import
Qwen2Config
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.attention.layers.encoder_only_attention
import
EncoderOnlyAttention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
...
...
vllm/model_executor/models/qwen2_moe.py
View file @
430dd4d9
...
...
@@ -34,7 +34,7 @@ import torch.nn.functional as F
from
torch
import
nn
from
transformers
import
Qwen2MoeConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/qwen3.py
View file @
430dd4d9
...
...
@@ -30,7 +30,8 @@ import torch
from
torch
import
nn
from
transformers
import
Qwen3Config
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/qwen3_moe.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ from typing import Any
import
torch
from
torch
import
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
,
get_current_vllm_config
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/qwen3_next.py
View file @
430dd4d9
...
...
@@ -10,7 +10,8 @@ from einops import rearrange
from
torch
import
nn
from
transformers.activations
import
ACT2FN
from
vllm.attention
import
Attention
,
AttentionMetadata
from
vllm.attention.backends.abstract
import
AttentionMetadata
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
(
CacheConfig
,
...
...
vllm/model_executor/models/seed_oss.py
View file @
430dd4d9
...
...
@@ -30,7 +30,8 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
as
SeedOssConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
Prev
1
2
3
4
5
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment