Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
430dd4d9
Unverified
Commit
430dd4d9
authored
Nov 26, 2025
by
Matthew Bonanni
Committed by
GitHub
Nov 26, 2025
Browse files
[Attention] Remove imports from `vllm/attention/__init__.py` (#29342)
Signed-off-by:
Matthew Bonanni
<
mbonanni@redhat.com
>
parent
c4c0354e
Changes
96
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
24 additions
and
21 deletions
+24
-21
vllm/model_executor/models/gpt_bigcode.py
vllm/model_executor/models/gpt_bigcode.py
+1
-1
vllm/model_executor/models/gpt_j.py
vllm/model_executor/models/gpt_j.py
+1
-1
vllm/model_executor/models/gpt_neox.py
vllm/model_executor/models/gpt_neox.py
+1
-1
vllm/model_executor/models/gpt_oss.py
vllm/model_executor/models/gpt_oss.py
+2
-1
vllm/model_executor/models/granite.py
vllm/model_executor/models/granite.py
+1
-1
vllm/model_executor/models/granitemoe.py
vllm/model_executor/models/granitemoe.py
+1
-1
vllm/model_executor/models/grok1.py
vllm/model_executor/models/grok1.py
+1
-1
vllm/model_executor/models/hunyuan_v1.py
vllm/model_executor/models/hunyuan_v1.py
+2
-1
vllm/model_executor/models/internlm2.py
vllm/model_executor/models/internlm2.py
+1
-1
vllm/model_executor/models/jais.py
vllm/model_executor/models/jais.py
+1
-1
vllm/model_executor/models/lfm2.py
vllm/model_executor/models/lfm2.py
+1
-1
vllm/model_executor/models/lfm2_moe.py
vllm/model_executor/models/lfm2_moe.py
+1
-1
vllm/model_executor/models/llama.py
vllm/model_executor/models/llama.py
+2
-1
vllm/model_executor/models/llama4.py
vllm/model_executor/models/llama4.py
+1
-1
vllm/model_executor/models/minicpm.py
vllm/model_executor/models/minicpm.py
+1
-1
vllm/model_executor/models/minicpm3.py
vllm/model_executor/models/minicpm3.py
+1
-1
vllm/model_executor/models/minimax_m2.py
vllm/model_executor/models/minimax_m2.py
+1
-1
vllm/model_executor/models/minimax_text_01.py
vllm/model_executor/models/minimax_text_01.py
+2
-1
vllm/model_executor/models/mixtral.py
vllm/model_executor/models/mixtral.py
+1
-1
vllm/model_executor/models/molmo.py
vllm/model_executor/models/molmo.py
+1
-2
No files found.
vllm/model_executor/models/gpt_bigcode.py
View file @
430dd4d9
...
...
@@ -28,7 +28,7 @@ import torch
from
torch
import
nn
from
transformers
import
GPTBigCodeConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/gpt_j.py
View file @
430dd4d9
...
...
@@ -26,7 +26,7 @@ import torch
from
torch
import
nn
from
transformers
import
GPTJConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/gpt_neox.py
View file @
430dd4d9
...
...
@@ -26,7 +26,7 @@ import torch
from
torch
import
nn
from
transformers
import
GPTNeoXConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/gpt_oss.py
View file @
430dd4d9
...
...
@@ -7,7 +7,8 @@ import torch.distributed as dist
from
torch
import
nn
from
transformers
import
GptOssConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/granite.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
from
torch
import
nn
from
transformers
import
GraniteConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/granitemoe.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ from typing import Any
import
torch
from
torch
import
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/grok1.py
View file @
430dd4d9
...
...
@@ -31,7 +31,7 @@ import torch
import
torch.nn.functional
as
F
from
torch
import
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/hunyuan_v1.py
View file @
430dd4d9
...
...
@@ -33,7 +33,8 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
,
get_current_vllm_config
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/internlm2.py
View file @
430dd4d9
...
...
@@ -10,7 +10,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/jais.py
View file @
430dd4d9
...
...
@@ -28,7 +28,7 @@ from itertools import islice
import
torch
from
torch
import
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/lfm2.py
View file @
430dd4d9
...
...
@@ -7,7 +7,7 @@ import torch
import
torch.nn
as
nn
from
transformers
import
Lfm2Config
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ModelConfig
,
VllmConfig
from
vllm.distributed
import
get_pp_group
,
get_tensor_model_parallel_world_size
...
...
vllm/model_executor/models/lfm2_moe.py
View file @
430dd4d9
...
...
@@ -6,7 +6,7 @@ from itertools import islice
import
torch
import
torch.nn
as
nn
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ModelConfig
,
VllmConfig
,
get_current_vllm_config
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/llama.py
View file @
430dd4d9
...
...
@@ -31,7 +31,8 @@ import torch
from
torch
import
nn
from
transformers
import
LlamaConfig
from
vllm.attention
import
Attention
,
AttentionType
from
vllm.attention.backends.abstract
import
AttentionType
from
vllm.attention.layer
import
Attention
from
vllm.attention.layers.encoder_only_attention
import
EncoderOnlyAttention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
...
...
vllm/model_executor/models/llama4.py
View file @
430dd4d9
...
...
@@ -24,7 +24,7 @@ import torch
from
torch
import
nn
from
transformers
import
Llama4TextConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.attention.layers.chunked_local_attention
import
ChunkedLocalAttention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
...
...
vllm/model_executor/models/minicpm.py
View file @
430dd4d9
...
...
@@ -33,7 +33,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/minicpm3.py
View file @
430dd4d9
...
...
@@ -29,7 +29,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.distributed
import
get_tensor_model_parallel_world_size
from
vllm.model_executor.layers.layernorm
import
RMSNorm
...
...
vllm/model_executor/models/minimax_m2.py
View file @
430dd4d9
...
...
@@ -30,7 +30,7 @@ import torch
from
torch
import
nn
from
transformers
import
PretrainedConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ModelConfig
,
VllmConfig
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/minimax_text_01.py
View file @
430dd4d9
...
...
@@ -14,7 +14,8 @@ import torch
from
torch
import
nn
from
transformers
import
MiniMaxConfig
from
vllm.attention
import
Attention
,
AttentionMetadata
from
vllm.attention.backends.abstract
import
AttentionMetadata
from
vllm.attention.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
ModelConfig
,
VllmConfig
from
vllm.distributed.parallel_state
import
(
...
...
vllm/model_executor/models/mixtral.py
View file @
430dd4d9
...
...
@@ -32,7 +32,7 @@ import torch
from
torch
import
nn
from
transformers
import
MixtralConfig
from
vllm.attention
import
Attention
from
vllm.attention
.layer
import
Attention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
,
get_current_vllm_config
from
vllm.distributed
import
(
...
...
vllm/model_executor/models/molmo.py
View file @
430dd4d9
...
...
@@ -17,8 +17,7 @@ from transformers import BatchFeature, PretrainedConfig, ProcessorMixin, TensorT
from
transformers.image_utils
import
ImageInput
from
transformers.tokenization_utils_base
import
TextInput
from
vllm.attention
import
Attention
from
vllm.attention.layer
import
MultiHeadAttention
from
vllm.attention.layer
import
Attention
,
MultiHeadAttention
from
vllm.compilation.decorators
import
support_torch_compile
from
vllm.config
import
CacheConfig
,
VllmConfig
from
vllm.config.multimodal
import
BaseDummyOptions
...
...
Prev
1
2
3
4
5
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment