Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
eebd1465
Unverified
Commit
eebd1465
authored
Mar 07, 2026
by
qli88
Committed by
GitHub
Mar 07, 2026
Browse files
[CI] Enable Crosslayer KV layout tests for ROCm platforms (#35416)
parent
ebb9cc5f
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
44 additions
and
13 deletions
+44
-13
.buildkite/test-amd.yaml
.buildkite/test-amd.yaml
+28
-0
tests/v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
..._connector/nixl_integration/config_sweep_accuracy_test.sh
+16
-13
No files found.
.buildkite/test-amd.yaml
View file @
eebd1465
...
@@ -1486,6 +1486,20 @@ steps:
...
@@ -1486,6 +1486,20 @@ steps:
-
uv pip install --system -r /vllm-workspace/requirements/kv_connectors_rocm.txt
-
uv pip install --system -r /vllm-workspace/requirements/kv_connectors_rocm.txt
-
DP_EP=1 ROCM_ATTN=1 bash v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
-
DP_EP=1 ROCM_ATTN=1 bash v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
-
label
:
CrossLayer KV layout Distributed NixlConnector PD accuracy tests (4 GPUs)
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_4
# grade: Blocking
timeout_in_minutes
:
30
working_dir
:
"
/vllm-workspace/tests"
num_devices
:
4
source_file_dependencies
:
-
vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py
-
tests/v1/kv_connector/nixl_integration/
commands
:
-
uv pip install --system -r /vllm-workspace/requirements/kv_connectors_rocm.txt
-
CROSS_LAYERS_BLOCKS=1 ROCM_ATTN=1 bash v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
##### multi gpus test #####
##### multi gpus test #####
##### A100 test #####
##### A100 test #####
...
@@ -3136,6 +3150,20 @@ steps:
...
@@ -3136,6 +3150,20 @@ steps:
-
uv pip install --system -r /vllm-workspace/requirements/kv_connectors_rocm.txt
-
uv pip install --system -r /vllm-workspace/requirements/kv_connectors_rocm.txt
-
DP_EP=1 ROCM_ATTN=1 bash v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
-
DP_EP=1 ROCM_ATTN=1 bash v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
-
label
:
CrossLayer KV layout Distributed NixlConnector PD accuracy tests (4 GPUs)
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_4
# grade: Blocking
timeout_in_minutes
:
30
working_dir
:
"
/vllm-workspace/tests"
num_devices
:
4
source_file_dependencies
:
-
vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py
-
tests/v1/kv_connector/nixl_integration/
commands
:
-
uv pip install --system -r /vllm-workspace/requirements/kv_connectors_rocm.txt
-
CROSS_LAYERS_BLOCKS=1 ROCM_ATTN=1 bash v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
##### multi gpus test #####
##### multi gpus test #####
##### A100 test #####
##### A100 test #####
...
...
tests/v1/kv_connector/nixl_integration/config_sweep_accuracy_test.sh
View file @
eebd1465
...
@@ -56,24 +56,27 @@ run_tests() {
...
@@ -56,24 +56,27 @@ run_tests() {
echo
"✅ All
${
label
}
tests passed!"
echo
"✅ All
${
label
}
tests passed!"
}
}
# Run tests
# Set backend
label
=
"default backend"
cmdline_args
=
""
if
[[
-n
"
${
ROCM_ATTN
:-}
"
]]
;
then
if
[[
-n
"
${
ROCM_ATTN
:-}
"
]]
;
then
echo
"ROCM_ATTN is set, running with --attention-backend ROCM_ATTN"
echo
"ROCM_ATTN is set, running with --attention-backend ROCM_ATTN"
run_tests
"ROCM_ATTN backend"
"--attention-backend ROCM_ATTN"
label
=
"ROCM_ATTN backend"
else
cmdline_args
=
" --attention-backend ROCM_ATTN "
run_tests
"default backend"
""
elif
[[
-n
"
${
FLASHINFER
:-}
"
]]
;
then
fi
echo
"FLASHINFER is set, running with --attention-backend FLASHINFER"
label
=
"FLASHINFER backend"
# Check if FLASHINFER is set (non-empty)
cmdline_args
=
" --attention-backend FLASHINFER "
if
[[
-n
"
${
FLASHINFER
:-}
"
]]
;
then
echo
"FLASHINFER is set, rerunning with --attention-backend FLASHINFER"
run_tests
"FLASHINFER backend"
"--attention-backend FLASHINFER"
else
else
echo
"
FLASHINFER not set, skipping FLASHINFER runs.
"
echo
"
running with default attention backend
"
fi
fi
# Check if cross-layers is enabled (non-empty)
# Check if cross-layers is enabled (non-empty)
if
[[
-n
"
${
CROSS_LAYERS_BLOCKS
:-}
"
]]
;
then
if
[[
-n
"
${
CROSS_LAYERS_BLOCKS
:-}
"
]]
;
then
echo
"CROSS_LAYERS_BLOCKS is set, rerunning with --enable-cross-layers"
echo
"CROSS_LAYERS_BLOCKS is set, running with --enable-cross-layers"
run_tests
"default backend"
"--enable-cross-layers"
label+
=
" - CROSS_LAYERS_BLOCKS enabled"
cmdline_args+
=
" --enable-cross-layers "
fi
fi
# Run tests
run_tests
"
${
label
}
"
"
${
cmdline_args
}
"
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment