Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
de2cc3d8
Unverified
Commit
de2cc3d8
authored
Sep 15, 2025
by
Wentao Ye
Committed by
GitHub
Sep 15, 2025
Browse files
[Deprecation] Remove DeepGEMM Old Symbol Wrapper (#24902)
Signed-off-by:
yewentao256
<
zhyanwentao@126.com
>
parent
e9508430
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
3 additions
and
25 deletions
+3
-25
vllm/utils/deep_gemm.py
vllm/utils/deep_gemm.py
+3
-25
No files found.
vllm/utils/deep_gemm.py
View file @
de2cc3d8
...
...
@@ -67,23 +67,6 @@ def _missing(*_: Any, **__: Any) -> NoReturn:
"package to enable FP8 kernels."
)
def _resolve_symbol(module, new: str, old: str) -> Callable[..., Any] | None:
    """Look up a symbol on *module*, preferring its current name.

    Args:
        module: Object (normally the imported ``deep_gemm`` module) to search.
        new: Attribute name to try first.
        old: Legacy attribute name tried only when *new* is absent.

    Returns:
        The attribute stored under *new* if present; otherwise the attribute
        stored under *old* (after logging a one-time warning); otherwise
        ``None`` when neither name exists on *module*.
    """
    # Preferred path: the up-to-date name is available.
    if hasattr(module, new):
        return getattr(module, new)

    # Neither spelling exists, so there is nothing to hand back.
    if not hasattr(module, old):
        return None

    # Only the legacy name is present: nudge the user to upgrade, then use it.
    # TODO(wentao): deprecate old symbol in the future.
    logger.warning_once(
        "Found legacy DeepGEMM symbol `%s`. Please upgrade the `deep_gemm` "
        "package so that `%s` is available. Support for the legacy symbol "
        "will be removed in a future vLLM release.",
        old,
        new,
    )
    return getattr(module, old)
# Module-level slots for the DeepGEMM entry points. Each starts as ``None``;
# the visible part of this file rebinds them inside ``_lazy_init`` once the
# ``deep_gemm`` package has been imported.
# NOTE(review): presumably a slot that is still ``None`` after initialisation
# means the installed package does not expose that symbol — confirm against
# the callers.
_fp8_gemm_nt_impl: Callable[..., Any] | None = None
_grouped_impl: Callable[..., Any] | None = None
_grouped_masked_impl: Callable[..., Any] | None = None
...
...
@@ -109,14 +92,9 @@ def _lazy_init() -> None:
_dg
=
importlib
.
import_module
(
"deep_gemm"
)
_fp8_gemm_nt_impl
=
_resolve_symbol
(
_dg
,
"fp8_gemm_nt"
,
"gemm_fp8_fp8_bf16_nt"
)
_grouped_impl
=
_resolve_symbol
(
_dg
,
"m_grouped_fp8_gemm_nt_contiguous"
,
"m_grouped_gemm_fp8_fp8_bf16_nt_contiguous"
)
_grouped_masked_impl
=
_resolve_symbol
(
_dg
,
"fp8_m_grouped_gemm_nt_masked"
,
"m_grouped_gemm_fp8_fp8_bf16_nt_masked"
)
_fp8_gemm_nt_impl
=
getattr
(
_dg
,
"fp8_gemm_nt"
,
None
)
_grouped_impl
=
getattr
(
_dg
,
"m_grouped_fp8_gemm_nt_contiguous"
,
None
)
_grouped_masked_impl
=
getattr
(
_dg
,
"fp8_m_grouped_gemm_nt_masked"
,
None
)
def
fp8_gemm_nt
(
*
args
,
**
kwargs
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment