Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
430dd4d9
Unverified
Commit
430dd4d9
authored
Nov 26, 2025
by
Matthew Bonanni
Committed by
GitHub
Nov 26, 2025
Browse files
[Attention] Remove imports from `vllm/attention/__init__.py` (#29342)
Signed-off-by:
Matthew Bonanni
<
mbonanni@redhat.com
>
parent
c4c0354e
Changes
96
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
22 additions
and
21 deletions
+22
-21
vllm/model_executor/models/bloom.py
vllm/model_executor/models/bloom.py
+1
-1
vllm/model_executor/models/chameleon.py
vllm/model_executor/models/chameleon.py
+1
-1
vllm/model_executor/models/chatglm.py
vllm/model_executor/models/chatglm.py
+1
-1
vllm/model_executor/models/clip.py
vllm/model_executor/models/clip.py
+1
-2
vllm/model_executor/models/commandr.py
vllm/model_executor/models/commandr.py
+1
-1
vllm/model_executor/models/dbrx.py
vllm/model_executor/models/dbrx.py
+1
-1
vllm/model_executor/models/deepseek_v2.py
vllm/model_executor/models/deepseek_v2.py
+1
-1
vllm/model_executor/models/dots1.py
vllm/model_executor/models/dots1.py
+1
-1
vllm/model_executor/models/ernie45_moe.py
vllm/model_executor/models/ernie45_moe.py
+1
-1
vllm/model_executor/models/ernie45_vl_moe.py
vllm/model_executor/models/ernie45_vl_moe.py
+1
-1
vllm/model_executor/models/exaone.py
vllm/model_executor/models/exaone.py
+1
-1
vllm/model_executor/models/exaone4.py
vllm/model_executor/models/exaone4.py
+1
-1
vllm/model_executor/models/falcon.py
vllm/model_executor/models/falcon.py
+1
-1
vllm/model_executor/models/gemma.py
vllm/model_executor/models/gemma.py
+1
-1
vllm/model_executor/models/gemma2.py
vllm/model_executor/models/gemma2.py
+1
-1
vllm/model_executor/models/gemma3.py
vllm/model_executor/models/gemma3.py
+2
-1
vllm/model_executor/models/gemma3n.py
vllm/model_executor/models/gemma3n.py
+1
-1
vllm/model_executor/models/glm4.py
vllm/model_executor/models/glm4.py
+2
-1
vllm/model_executor/models/glm4_moe.py
vllm/model_executor/models/glm4_moe.py
+1
-1
vllm/model_executor/models/gpt2.py
vllm/model_executor/models/gpt2.py
+1
-1
No files found.
vllm/model_executor/models/bloom.py
View file @
430dd4d9
...
...
@@ -27,7 +27,7 @@ import torch
from
torch
import
nn
from
transformers
import
BloomConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/chameleon.py
View file @
430dd4d9
...
...
@@ -16,7 +16,7 @@ from transformers import (
ChameleonVQVAEConfig
,
)
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.config.multimodal
import
BaseDummyOptions
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/chatglm.py
View file @
430dd4d9
...
...
@@ -12,7 +12,7 @@ import torch
from
torch
import
nn
from
torch.nn
import
LayerNorm
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/clip.py
View file @
430dd4d9
...
...
@@ -14,8 +14,7 @@ from transformers import (
CLIPVisionConfig
,
)
from
vllm.attention
import
Attention
from
vllm.attention.layer
import
MultiHeadAttention
from
vllm.attention.layer
import
Attention
,
MultiHeadAttention
from
vllm.config
import
VllmConfig
from
vllm.config.multimodal
import
BaseDummyOptions
from
vllm.distributed
import
divide
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/commandr.py
View file @
430dd4d9
...
...
@@ -30,7 +30,7 @@ import torch
from
torch
import
nn
from
transformers
import
Cohere2Config
,
CohereConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/dbrx.py
View file @
430dd4d9
...
...
@@ -8,7 +8,7 @@ import torch
import
torch.nn
as
nn
from
transformers
import
DbrxConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
get_pp_group
,
...
...
vllm/model_executor/models/deepseek_v2.py
View file @
430dd4d9
...
...
@@ -33,8 +33,8 @@ from torch import nn
from
transformers
import
DeepseekV2Config
,
DeepseekV3Config
from
vllm._aiter_ops
import
rocm_aiter_ops
from
vllm.attention
import
Attention
from
vllm.attention.backends.abstract
import
AttentionBackend
from
vllm.attention.layer
import
Attention
from
vllm.attention.ops.common
import
pack_seq_triton
,
unpack_seq_triton
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ParallelConfig
,
VllmConfig
,
get_current_vllm_config
...
...
vllm/model_executor/models/dots1.py
View file @
430dd4d9
...
...
@@ -32,7 +32,7 @@ import torch
from
torch
import
nn
from
transformers
import
Dots1Config
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ModelConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/ernie45_moe.py
View file @
430dd4d9
...
...
@@ -32,7 +32,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
,
get_current_vllm_config
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/ernie45_vl_moe.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
# from vllm.compilation.decorators import support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
...
...
vllm/model_executor/models/exaone.py
View file @
430dd4d9
...
...
@@ -32,7 +32,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/exaone4.py
View file @
430dd4d9
...
...
@@ -28,7 +28,7 @@ import torch
from
torch
import
nn
from
transformers
import
Exaone4Config
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/falcon.py
View file @
430dd4d9
...
...
@@ -30,7 +30,7 @@ from torch import nn
from
torch.nn
import
LayerNorm
from
transformers
import
FalconConfig
as
HF_FalconConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/gemma.py
View file @
430dd4d9
...
...
@@ -26,7 +26,7 @@ import torch
from
torch
import
nn
from
transformers
import
GemmaConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/gemma2.py
View file @
430dd4d9
...
...
@@ -23,7 +23,7 @@ import torch
from
torch
import
nn
from
transformers
import
Gemma2Config
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/gemma3.py
View file @
430dd4d9
...
...
@@ -23,7 +23,8 @@ import torch.nn.functional as F
from
torch
import
nn
from
transformers
import
Gemma3TextConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/gemma3n.py
View file @
430dd4d9
...
...
@@ -21,7 +21,7 @@ import torch
from
torch
import
nn
from
transformers.models.gemma3n.configuration_gemma3n
import
Gemma3nTextConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/glm4.py
View file @
430dd4d9
...
...
@@ -29,7 +29,8 @@ import torch
from
torch
import
nn
from
transformers
import
Glm4Config
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/glm4_moe.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
from
torch
import
nn
from
transformers.models.glm4_moe
import
Glm4MoeConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
,
get_current_vllm_config
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/gpt2.py
View file @
430dd4d9
...
...
@@ -27,7 +27,7 @@ import torch
from
torch
import
nn
from
transformers
import
GPT2Config
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed.parallel_state
import
(
...
...
Prev
1
2
3
4
5
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment