Commit 246e3e0a (unverified), authored by tracelogfb, committed by GitHub
Browse files

fix broken test vllm:test_kernels - test_attention_selector.py::test_flash_attn (#17873)


Co-authored-by: Stephen Chen <tracelog@meta.com>
parent 7042cc96
......@@ -188,8 +188,9 @@ def test_flash_attn(monkeypatch: pytest.MonkeyPatch):
m.setenv(STR_BACKEND_ENV_VAR, STR_FLASH_ATTN_VAL)
# Unsupported CUDA arch
- monkeypatch.setattr(torch.cuda, "get_device_capability", lambda:
- (7, 5))
+ monkeypatch.setattr(torch.cuda,
+ "get_device_capability",
+ lambda _=None: (7, 5))
backend = get_attn_backend(16, torch.float16, None, 16, False)
assert backend.get_name() != STR_FLASH_ATTN_VAL
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment