"vscode:/vscode.git/clone" did not exist on "a4c402a756fa3213caf9d2cde0e4ceb2d57727f2"
Unverified commit 0f3ce4c7, authored by Yan Ma, committed by GitHub
Browse files

[XPU] Fix spec-decode UTs under tests/v1/spec_decode (#38491)


Signed-off-by: Yan Ma <yan.ma@intel.com>
Co-authored-by: Kunshang Ji <kunshang.ji@intel.com>
parent af661a18
...@@ -755,12 +755,6 @@ def test_load_model( ...@@ -755,12 +755,6 @@ def test_load_model(
use_distinct_lm_head, use_distinct_lm_head,
monkeypatch, monkeypatch,
): ):
if attn_backend == "TRITON_ATTN" and not current_platform.is_rocm():
pytest.skip(
"TRITON_ATTN does not support "
"multi-token eagle spec decode on current platform"
)
if attn_backend == "ROCM_AITER_FA" and current_platform.is_rocm(): if attn_backend == "ROCM_AITER_FA" and current_platform.is_rocm():
monkeypatch.setenv("VLLM_ROCM_USE_AITER", "1") monkeypatch.setenv("VLLM_ROCM_USE_AITER", "1")
......
...@@ -15,8 +15,8 @@ DEVICE_TYPE = current_platform.device_type ...@@ -15,8 +15,8 @@ DEVICE_TYPE = current_platform.device_type
# Skip if no CUDA - Triton kernel requires GPU # Skip if no CUDA - Triton kernel requires GPU
pytest.importorskip("triton") pytest.importorskip("triton")
if not torch.cuda.is_available(): if not current_platform.is_cuda_alike() and not current_platform.is_xpu():
pytest.skip("CUDA required for EAGLE kernel tests", allow_module_level=True) pytest.skip("CUDA/XPU required for EAGLE kernel tests", allow_module_level=True)
def _reference_eagle_step_slot_mapping( def _reference_eagle_step_slot_mapping(
......
...@@ -38,12 +38,6 @@ def test_ngram_max_len(num_speculative_tokens: int): ...@@ -38,12 +38,6 @@ def test_ngram_max_len(num_speculative_tokens: int):
def test_eagle_max_len( def test_eagle_max_len(
monkeypatch: pytest.MonkeyPatch, num_speculative_tokens: int, attn_backend: str monkeypatch: pytest.MonkeyPatch, num_speculative_tokens: int, attn_backend: str
): ):
if attn_backend == "TRITON_ATTN" and not current_platform.is_rocm():
pytest.skip(
"TRITON_ATTN does not support "
"multi-token eagle spec decode on current platform"
)
if attn_backend == "ROCM_AITER_FA" and current_platform.is_rocm(): if attn_backend == "ROCM_AITER_FA" and current_platform.is_rocm():
monkeypatch.setenv("VLLM_ROCM_USE_AITER", "1") monkeypatch.setenv("VLLM_ROCM_USE_AITER", "1")
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment