refactor: abstract deepgemm support into platform (#37519)

Co-authored-by: sherryC41 <sherry.c.c41@gmail.com>

refactor: abstract deepgemm support into platform (#37519)
Co-authored-by: sherryC41 <sherry.c.c41@gmail.com>
6ec5e9fd · SherryC41 · GitHub · e1d85e5c · 6ec5e9fd · 6ec5e9fd
Unverified commit 6ec5e9fd, authored Mar 21, 2026 by SherryC41; committed by GitHub Mar 20, 2026
Show whitespace changes
Inline Side-by-side

Showing with 13 additions and 4 deletions

vllm/platforms/cuda.py vllm/platforms/cuda.py +5 -0

vllm/platforms/interface.py vllm/platforms/interface.py +7 -0

vllm/utils/deep_gemm.py vllm/utils/deep_gemm.py +1 -4

No files found.
--- a/vllm/platforms/cuda.py
+++ b/vllm/platforms/cuda.py
@@ -511,6 +511,11 @@ class CudaPlatformBase(Platform):
    def support_static_graph_mode(cls) -> bool:
        return True

+    @classmethod
+    def support_deep_gemm(cls) -> bool:
+        """Currently, only Hopper and Blackwell GPUs are supported."""
+        return cls.is_device_capability(90) or cls.is_device_capability_family(100)
+
    @classmethod
    def num_compute_units(cls, device_id: int = 0) -> int:
        return torch.cuda.get_device_properties(device_id).multi_processor_count

--- a/vllm/platforms/interface.py
+++ b/vllm/platforms/interface.py
@@ -712,6 +712,13 @@ class Platform:
        """
        return False

+    @classmethod
+    def support_deep_gemm(cls) -> bool:
+        """
+        Returns whether DeepGEMM is supported by the current platform.
+        """
+        return False
+
    @classmethod
    def use_custom_op_collectives(cls) -> bool:
        """

--- a/vllm/utils/deep_gemm.py
+++ b/vllm/utils/deep_gemm.py
@@ -70,10 +70,7 @@ def is_deep_gemm_supported() -> bool:
    """Return `True` if DeepGEMM is supported on the current platform.
    Currently, only Hopper and Blackwell GPUs are supported.
    """
-    is_supported_arch = current_platform.is_cuda() and (
-        current_platform.is_device_capability(90)
-        or current_platform.is_device_capability_family(100)
-    )
+    is_supported_arch = current_platform.support_deep_gemm()
    return envs.VLLM_USE_DEEP_GEMM and has_deep_gemm() and is_supported_arch