Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
143844fa
Unverified
Commit
143844fa
authored
Sep 29, 2025
by
Kunshang Ji
Committed by
GitHub
Sep 29, 2025
Browse files
[XPU]Fix xpu spec decoding UTs, avoid using cuda graph (#25847)
Signed-off-by:
Kunshang Ji
<
kunshang.ji@intel.com
>
parent
219cfbe7
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
7 additions
and
4 deletions
+7
-4
.buildkite/scripts/hardware_ci/run-xpu-test.sh
.buildkite/scripts/hardware_ci/run-xpu-test.sh
+1
-1
tests/utils.py
tests/utils.py
+2
-0
vllm/v1/spec_decode/eagle.py
vllm/v1/spec_decode/eagle.py
+4
-3
No files found.
.buildkite/scripts/hardware_ci/run-xpu-test.sh
View file @
143844fa
...
@@ -42,7 +42,7 @@ docker run \
...
@@ -42,7 +42,7 @@ docker run \
pytest -v -s v1/sample --ignore=v1/sample/test_logprobs.py --ignore=v1/sample/test_logprobs_e2e.py
pytest -v -s v1/sample --ignore=v1/sample/test_logprobs.py --ignore=v1/sample/test_logprobs_e2e.py
pytest -v -s v1/worker --ignore=v1/worker/test_gpu_model_runner.py
pytest -v -s v1/worker --ignore=v1/worker/test_gpu_model_runner.py
pytest -v -s v1/structured_output
pytest -v -s v1/structured_output
pytest -v -s v1/spec_decode --ignore=v1/spec_decode/test_max_len.py
--ignore=v1/spec_decode/test_eagle.py
--ignore=v1/spec_decode/test_tree_attention.py
pytest -v -s v1/spec_decode --ignore=v1/spec_decode/test_max_len.py --ignore=v1/spec_decode/test_tree_attention.py
pytest -v -s v1/kv_connector/unit --ignore=v1/kv_connector/unit/test_multi_connector.py --ignore=v1/kv_connector/unit/test_nixl_connector.py --ignore=v1/kv_connector/unit/test_shared_storage_connector.py
pytest -v -s v1/kv_connector/unit --ignore=v1/kv_connector/unit/test_multi_connector.py --ignore=v1/kv_connector/unit/test_nixl_connector.py --ignore=v1/kv_connector/unit/test_shared_storage_connector.py
pytest -v -s v1/test_metrics
pytest -v -s v1/test_metrics
pytest -v -s v1/test_serial_utils.py
pytest -v -s v1/test_serial_utils.py
...
...
tests/utils.py
View file @
143844fa
...
@@ -1143,6 +1143,8 @@ def get_attn_backend_list_based_on_platform() -> list[str]:
...
@@ -1143,6 +1143,8 @@ def get_attn_backend_list_based_on_platform() -> list[str]:
print
(
"Skip FLASH_ATTN on ROCm as aiter is not installed"
)
print
(
"Skip FLASH_ATTN on ROCm as aiter is not installed"
)
return
attn_backend_list
return
attn_backend_list
elif
current_platform
.
is_xpu
():
return
[
"FLASH_ATTN"
,
"TRITON_ATTN"
]
else
:
else
:
raise
ValueError
(
"Unsupported platform"
)
raise
ValueError
(
"Unsupported platform"
)
...
...
vllm/v1/spec_decode/eagle.py
View file @
143844fa
...
@@ -72,12 +72,13 @@ class EagleProposer:
...
@@ -72,12 +72,13 @@ class EagleProposer:
self
.
attn_metadata_builder
:
Optional
[
AttentionMetadataBuilder
]
=
None
self
.
attn_metadata_builder
:
Optional
[
AttentionMetadataBuilder
]
=
None
self
.
use_cuda_graph
=
(
self
.
vllm_config
.
compilation_config
.
level
self
.
use_cuda_graph
=
(
not
current_platform
.
is_xpu
()
and
self
.
vllm_config
.
compilation_config
.
level
==
CompilationLevel
.
PIECEWISE
and
==
CompilationLevel
.
PIECEWISE
and
not
self
.
vllm_config
.
model_config
.
enforce_eager
)
not
self
.
vllm_config
.
model_config
.
enforce_eager
)
self
.
cudagraph_batch_sizes
=
list
(
self
.
cudagraph_batch_sizes
=
list
(
reversed
(
reversed
(
self
.
vllm_config
.
compilation_config
.
self
.
vllm_config
.
compilation_config
.
cudagraph_capture_sizes
))
cudagraph_capture_sizes
))
if
self
.
use_cuda_graph
else
[]
# persistent buffers for cuda graph
# persistent buffers for cuda graph
self
.
input_ids
=
torch
.
zeros
(
self
.
max_num_tokens
,
self
.
input_ids
=
torch
.
zeros
(
self
.
max_num_tokens
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment