Unverified commit 6d85b36a, authored by Vadim Gimpelson, committed by GitHub
Browse files

Revert #38730 and #38791 (#40032)


Signed-off-by: Vadim Gimpelson <vadim.gimpelson@gmail.com>
Signed-off-by: Vadim Gimpelson <156319763+vadiklyutiy@users.noreply.github.com>
parent ab5666eb
...@@ -72,7 +72,7 @@ def test_supports_sm100_with_artifactory(_art, _cap): ...@@ -72,7 +72,7 @@ def test_supports_sm100_with_artifactory(_art, _cap):
@patch("vllm.envs.VLLM_BATCH_INVARIANT", False) @patch("vllm.envs.VLLM_BATCH_INVARIANT", False)
@patch( @patch(
"vllm.utils.flashinfer.current_platform.is_device_capability", "vllm.utils.flashinfer.current_platform.is_device_capability_family",
return_value=False, return_value=False,
) )
def test_supports_non_sm100_platform(_cap): def test_supports_non_sm100_platform(_cap):
...@@ -81,7 +81,7 @@ def test_supports_non_sm100_platform(_cap): ...@@ -81,7 +81,7 @@ def test_supports_non_sm100_platform(_cap):
@patch("vllm.envs.VLLM_BATCH_INVARIANT", False) @patch("vllm.envs.VLLM_BATCH_INVARIANT", False)
@patch( @patch(
"vllm.utils.flashinfer.current_platform.is_device_capability", "vllm.utils.flashinfer.current_platform.is_device_capability_family",
return_value=True, return_value=True,
) )
@patch("vllm.utils.flashinfer.has_nvidia_artifactory", return_value=False) @patch("vllm.utils.flashinfer.has_nvidia_artifactory", return_value=False)
......
...@@ -235,11 +235,10 @@ def _resolve_import_to_file( ...@@ -235,11 +235,10 @@ def _resolve_import_to_file(
def _find_cc_in_function(tree: ast.AST, func_name: str) -> str | None: def _find_cc_in_function(tree: ast.AST, func_name: str) -> str | None:
"""Find a compute capability from is_device_capability*() calls in a function. """Find a compute capability from is_device_capability_family() calls in a function.
Handles two patterns: Looks for the pattern: current_platform.is_device_capability_family(N)
- is_device_capability_family(N): "M.x" (e.g. 100 -> "10.x") and converts N (e.g. 100) to a CC string (e.g. "10.x").
- is_device_capability(N): "M.m" (e.g. 100 -> "10.0")
""" """
for node in ast.walk(tree): for node in ast.walk(tree):
if not isinstance(node, ast.FunctionDef) or node.name != func_name: if not isinstance(node, ast.FunctionDef) or node.name != func_name:
...@@ -248,15 +247,12 @@ def _find_cc_in_function(tree: ast.AST, func_name: str) -> str | None: ...@@ -248,15 +247,12 @@ def _find_cc_in_function(tree: ast.AST, func_name: str) -> str | None:
if ( if (
isinstance(n, ast.Call) isinstance(n, ast.Call)
and isinstance(n.func, ast.Attribute) and isinstance(n.func, ast.Attribute)
and n.func.attr == "is_device_capability_family"
and n.args and n.args
and isinstance(n.args[0], ast.Constant) and isinstance(n.args[0], ast.Constant)
and isinstance(n.args[0].value, int) and isinstance(n.args[0].value, int)
): ):
val = n.args[0].value return f"{n.args[0].value // 10}.x"
if n.func.attr == "is_device_capability_family":
return f"{val // 10}.x"
elif n.func.attr == "is_device_capability":
return f"{val // 10}.{val % 10}"
return None return None
......
...@@ -305,6 +305,7 @@ def supports_trtllm_attention() -> bool: ...@@ -305,6 +305,7 @@ def supports_trtllm_attention() -> bool:
if envs.VLLM_BATCH_INVARIANT: if envs.VLLM_BATCH_INVARIANT:
return False return False
# Requires SM100 and NVIDIA artifactory to be accessible to download cubins
return ( return (
current_platform.is_device_capability_family(100) and has_nvidia_artifactory() current_platform.is_device_capability_family(100) and has_nvidia_artifactory()
) )
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment.