Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
6ec5e9fd
Unverified
Commit
6ec5e9fd
authored
Mar 21, 2026
by
SherryC41
Committed by
GitHub
Mar 20, 2026
Browse files
refactor: abstract deepgemm support into platform (#37519)
Co-authored-by:
sherryC41
<
sherry.c.c41@gmail.com
>
parent
e1d85e5c
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
13 additions
and
4 deletions
+13
-4
vllm/platforms/cuda.py
vllm/platforms/cuda.py
+5
-0
vllm/platforms/interface.py
vllm/platforms/interface.py
+7
-0
vllm/utils/deep_gemm.py
vllm/utils/deep_gemm.py
+1
-4
No files found.
vllm/platforms/cuda.py
View file @
6ec5e9fd
...
@@ -511,6 +511,11 @@ class CudaPlatformBase(Platform):
...
@@ -511,6 +511,11 @@ class CudaPlatformBase(Platform):
def
support_static_graph_mode
(
cls
)
->
bool
:
def
support_static_graph_mode
(
cls
)
->
bool
:
return
True
return
True
@classmethod
def support_deep_gemm(cls) -> bool:
    """Return whether DeepGEMM is supported on the current CUDA device.

    Currently, only Hopper and Blackwell GPUs are supported; the check
    passes when the device capability is 90 or when the device belongs
    to the capability family 100.
    """
    # `or` short-circuits: the family check only runs when the exact
    # capability-90 check fails.
    return cls.is_device_capability(90) or cls.is_device_capability_family(100)
@
classmethod
@
classmethod
def
num_compute_units
(
cls
,
device_id
:
int
=
0
)
->
int
:
def
num_compute_units
(
cls
,
device_id
:
int
=
0
)
->
int
:
return
torch
.
cuda
.
get_device_properties
(
device_id
).
multi_processor_count
return
torch
.
cuda
.
get_device_properties
(
device_id
).
multi_processor_count
...
...
vllm/platforms/interface.py
View file @
6ec5e9fd
...
@@ -712,6 +712,13 @@ class Platform:
...
@@ -712,6 +712,13 @@ class Platform:
"""
"""
return
False
return
False
@classmethod
def support_deep_gemm(cls) -> bool:
    """Return whether DeepGEMM is supported by the current platform.

    The base implementation reports no support; a platform that can run
    DeepGEMM overrides this method.
    """
    return False
@
classmethod
@
classmethod
def
use_custom_op_collectives
(
cls
)
->
bool
:
def
use_custom_op_collectives
(
cls
)
->
bool
:
"""
"""
...
...
vllm/utils/deep_gemm.py
View file @
6ec5e9fd
...
@@ -70,10 +70,7 @@ def is_deep_gemm_supported() -> bool:
...
@@ -70,10 +70,7 @@ def is_deep_gemm_supported() -> bool:
"""Return `True` if DeepGEMM is supported on the current platform.
"""Return `True` if DeepGEMM is supported on the current platform.
Currently, only Hopper and Blackwell GPUs are supported.
Currently, only Hopper and Blackwell GPUs are supported.
"""
"""
is_supported_arch
=
current_platform
.
is_cuda
()
and
(
is_supported_arch
=
current_platform
.
support_deep_gemm
()
current_platform
.
is_device_capability
(
90
)
or
current_platform
.
is_device_capability_family
(
100
)
)
return
envs
.
VLLM_USE_DEEP_GEMM
and
has_deep_gemm
()
and
is_supported_arch
return
envs
.
VLLM_USE_DEEP_GEMM
and
has_deep_gemm
()
and
is_supported_arch
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment