Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
81939e77
Unverified
Commit
81939e77
authored
Mar 10, 2026
by
Andreas Karatzas
Committed by
GitHub
Mar 10, 2026
Browse files
[ROCm][CI] Making some tests optional to reduce workload (#36090)
Signed-off-by:
Andreas Karatzas
<
akaratza@amd.com
>
parent
195d1ca3
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
117 additions
and
34 deletions
+117
-34
.buildkite/test-amd.yaml
.buildkite/test-amd.yaml
+117
-4
.buildkite/test_areas/basic_correctness.yaml
.buildkite/test_areas/basic_correctness.yaml
+0
-5
.buildkite/test_areas/entrypoints.yaml
.buildkite/test_areas/entrypoints.yaml
+0
-15
.buildkite/test_areas/misc.yaml
.buildkite/test_areas/misc.yaml
+0
-5
.buildkite/test_areas/plugins.yaml
.buildkite/test_areas/plugins.yaml
+0
-5
No files found.
.buildkite/test-amd.yaml
View file @
81939e77
...
...
@@ -42,6 +42,7 @@ steps:
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi325_1
grade
:
Blocking
optional
:
true
soft_fail
:
true
source_file_dependencies
:
-
requirements/nightly_torch_test.txt
...
...
@@ -67,6 +68,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
vllm/
...
...
@@ -97,6 +99,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
tests/standalone_tests/python_only_compile.sh
...
...
@@ -140,6 +143,7 @@ steps:
timeout_in_minutes
:
40
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
working_dir
:
"
/vllm-workspace/tests"
fast_check
:
true
...
...
@@ -503,6 +507,7 @@ steps:
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi325_1
grade
:
Blocking
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/v1
...
...
@@ -520,6 +525,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
working_dir
:
"
/vllm-workspace/examples"
source_file_dependencies
:
...
...
@@ -823,6 +829,7 @@ steps:
timeout_in_minutes
:
90
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
csrc/
...
...
@@ -936,6 +943,7 @@ steps:
timeout_in_minutes
:
25
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
torch_nightly
:
true
source_file_dependencies
:
...
...
@@ -1046,6 +1054,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/models/multimodal
...
...
@@ -1059,6 +1068,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
vllm/
...
...
@@ -1072,6 +1082,7 @@ steps:
timeout_in_minutes
:
100
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
torch_nightly
:
true
source_file_dependencies
:
...
...
@@ -1090,6 +1101,7 @@ steps:
timeout_in_minutes
:
10
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_1
optional
:
true
# grade: Blocking
working_dir
:
"
/vllm-workspace/.buildkite/lm-eval-harness"
source_file_dependencies
:
...
...
@@ -1355,6 +1367,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_2
optional
:
true
# grade: Blocking
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
2
...
...
@@ -1393,6 +1406,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_4
optional
:
true
# grade: Blocking
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
4
...
...
@@ -1410,6 +1424,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_4
optional
:
true
# grade: Blocking
num_gpus
:
4
source_file_dependencies
:
...
...
@@ -1461,6 +1476,7 @@ steps:
-
label
:
NixlConnector PD accuracy tests (Distributed)
# 30min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_4
optional
:
true
# grade: Blocking
timeout_in_minutes
:
30
working_dir
:
"
/vllm-workspace/tests"
...
...
@@ -1475,6 +1491,7 @@ steps:
-
label
:
DP EP NixlConnector PD accuracy tests (Distributed)
# 15min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi325_4
optional
:
true
# grade: Blocking
timeout_in_minutes
:
15
working_dir
:
"
/vllm-workspace/tests"
...
...
@@ -1779,6 +1796,7 @@ steps:
# in /vllm/tools/pre_commit/generate_nightly_torch_test.py
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi355_1
optional
:
true
soft_fail
:
true
source_file_dependencies
:
-
requirements/nightly_torch_test.txt
...
...
@@ -1789,6 +1807,7 @@ steps:
timeout_in_minutes
:
15
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/multimodal
...
...
@@ -1801,6 +1820,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/test_inputs.py
...
...
@@ -1830,6 +1850,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
tests/standalone_tests/python_only_compile.sh
-
setup.py
...
...
@@ -1840,6 +1861,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
fast_check
:
true
torch_nightly
:
true
source_file_dependencies
:
...
...
@@ -1870,6 +1892,7 @@ steps:
timeout_in_minutes
:
40
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
fast_check
:
true
torch_nightly
:
true
...
...
@@ -1887,6 +1910,7 @@ steps:
timeout_in_minutes
:
130
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
fast_check
:
true
torch_nightly
:
true
...
...
@@ -1903,6 +1927,7 @@ steps:
timeout_in_minutes
:
50
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
fast_check
:
true
torch_nightly
:
true
...
...
@@ -1921,6 +1946,7 @@ steps:
timeout_in_minutes
:
50
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
fast_check
:
true
torch_nightly
:
true
...
...
@@ -1935,6 +1961,7 @@ steps:
timeout_in_minutes
:
50
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
fast_check
:
true
torch_nightly
:
true
...
...
@@ -2013,6 +2040,7 @@ steps:
timeout_in_minutes
:
10
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_8
optional
:
true
gpu
:
h100
num_gpus
:
8
working_dir
:
"
/vllm-workspace/tests"
...
...
@@ -2033,6 +2061,7 @@ steps:
-
label
:
EPLB Algorithm Test
# 5min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi355_1
optional
:
true
timeout_in_minutes
:
15
working_dir
:
"
/vllm-workspace/tests"
source_file_dependencies
:
...
...
@@ -2044,6 +2073,7 @@ steps:
-
label
:
EPLB Execution Test
# 10min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_4
optional
:
true
timeout_in_minutes
:
20
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
4
...
...
@@ -2058,6 +2088,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_2
optional
:
true
num_gpus
:
2
source_file_dependencies
:
-
vllm/
...
...
@@ -2099,12 +2130,13 @@ steps:
commands
:
-
pytest -v -s engine test_sequence.py test_config.py test_logger.py test_vllm_port.py
-
label
:
V1 Test e2e + engine
# 65min
timeout_in_minutes
:
90
mirror_hardwares
:
[
amdexperimental
]
# The test uses 4 GPUs, but we schedule it on 8-GPU machines for stability.
# See discussion here: https://github.com/vllm-project/vllm/pull/31040
agent_pool
:
mi355_8
agent_pool
:
mi355_1
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
vllm/
-
tests/v1
...
...
@@ -2114,10 +2146,39 @@ steps:
-
pytest -v -s v1/e2e
-
pytest -v -s v1/engine
-
label
:
V1 Test e2e (2 GPUs)
# 65min
timeout_in_minutes
:
90
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_2
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
vllm/
-
tests/v1
commands
:
# Only run tests that need exactly 2 GPUs
-
pytest -v -s v1/e2e/test_spec_decode.py -k "tensor_parallelism"
-
label
:
V1 Test e2e (4 GPUs)
# 65min
timeout_in_minutes
:
90
mirror_hardwares
:
[
amdexperimental
]
# The test uses 4 GPUs, but we schedule it on 8-GPU machines for stability.
# See discussion here: https://github.com/vllm-project/vllm/pull/31040
agent_pool
:
mi355_4
optional
:
true
# grade: Blocking
source_file_dependencies
:
-
vllm/
-
tests/v1
commands
:
# Only run tests that need 4 GPUs
-
pytest -v -s v1/e2e/test_spec_decode.py -k "eagle_correctness_heavy"
-
label
:
V1 Test entrypoints
# 35min
timeout_in_minutes
:
50
mirror_hardwares
:
[
amdexperimental
,
amdproduction
,
amdtentative
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/v1
...
...
@@ -2128,6 +2189,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/v1
...
...
@@ -2150,7 +2212,19 @@ steps:
-
pip install -U git+https://github.com/robertgshaw2-redhat/lm-evaluation-harness.git@streaming-api
-
pytest -v -s entrypoints/openai/correctness/test_lmeval.py::test_lm_eval_accuracy_v1_engine
# TODO: Add the "V1 Test attention (MI300)" test group
-
label
:
V1 Test attention (H100)
# 10min
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
timeout_in_minutes
:
30
gpu
:
h100
source_file_dependencies
:
-
vllm/config/attention.py
-
vllm/model_executor/layers/attention
-
vllm/v1/attention
-
tests/v1/attention
commands
:
-
pytest -v -s v1/attention
-
label
:
Batch Invariance Tests (H100)
# 10min
mirror_hardwares
:
[
amdexperimental
]
...
...
@@ -2200,6 +2274,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/examples"
source_file_dependencies
:
-
vllm/entrypoints
...
...
@@ -2234,6 +2309,7 @@ steps:
timeout_in_minutes
:
15
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/cuda
...
...
@@ -2245,6 +2321,7 @@ steps:
timeout_in_minutes
:
75
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/model_executor/layers
-
vllm/sampling_metadata.py
...
...
@@ -2277,6 +2354,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2293,6 +2371,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2308,6 +2387,7 @@ steps:
timeout_in_minutes
:
40
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
# grade: Blocking
torch_nightly
:
true
source_file_dependencies
:
...
...
@@ -2325,6 +2405,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
tests/v1/cudagraph
-
vllm/v1/cudagraph_dispatcher.py
...
...
@@ -2338,6 +2419,7 @@ steps:
timeout_in_minutes
:
75
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/
-
tests/kernels/core
...
...
@@ -2349,6 +2431,7 @@ steps:
timeout_in_minutes
:
35
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/attention/
-
vllm/v1/attention
...
...
@@ -2363,6 +2446,7 @@ steps:
timeout_in_minutes
:
90
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/quantization/
-
vllm/model_executor/layers/quantization
...
...
@@ -2375,6 +2459,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/quantization/cutlass_w8a8/moe/
-
csrc/moe/
...
...
@@ -2391,6 +2476,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/mamba/
-
tests/kernels/mamba
...
...
@@ -2422,6 +2508,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/utils/import_utils.py
-
tests/kernels/helion/
...
...
@@ -2434,6 +2521,7 @@ steps:
torch_nightly
:
true
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/engine/arg_utils.py
-
vllm/config/model.py
...
...
@@ -2450,6 +2538,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/.buildkite"
source_file_dependencies
:
-
benchmarks/
...
...
@@ -2460,6 +2549,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/benchmarks/
...
...
@@ -2470,6 +2560,7 @@ steps:
timeout_in_minutes
:
90
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/
-
vllm/model_executor/layers/quantization
...
...
@@ -2490,6 +2581,7 @@ steps:
timeout_in_minutes
:
75
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/
-
vllm/model_executor/layers/quantization
...
...
@@ -2501,6 +2593,7 @@ steps:
timeout_in_minutes
:
15
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
csrc/
-
vllm/entrypoints/openai/
...
...
@@ -2517,6 +2610,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2529,6 +2623,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/model_executor/models/
...
...
@@ -2548,6 +2643,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2560,6 +2656,7 @@ steps:
-
label
:
Basic Models Test (Other CPU)
# 5min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
timeout_in_minutes
:
10
torch_nightly
:
true
source_file_dependencies
:
...
...
@@ -2574,6 +2671,7 @@ steps:
timeout_in_minutes
:
25
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2587,6 +2685,7 @@ steps:
timeout_in_minutes
:
45
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/model_executor/models/
...
...
@@ -2607,6 +2706,7 @@ steps:
timeout_in_minutes
:
75
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2676,6 +2776,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/models/multimodal
...
...
@@ -2688,6 +2789,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/models/multimodal
...
...
@@ -2699,6 +2801,7 @@ steps:
timeout_in_minutes
:
100
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_1
optional
:
true
torch_nightly
:
true
source_file_dependencies
:
-
vllm/
...
...
@@ -2716,6 +2819,7 @@ steps:
timeout_in_minutes
:
10
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
working_dir
:
"
/vllm-workspace/.buildkite/lm-eval-harness"
source_file_dependencies
:
-
vllm/multimodal/
...
...
@@ -2772,6 +2876,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_1
optional
:
true
source_file_dependencies
:
-
vllm/model_executor/layers/quantization
-
tests/models/quantization
...
...
@@ -2923,6 +3028,7 @@ steps:
timeout_in_minutes
:
20
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_2
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
2
source_file_dependencies
:
...
...
@@ -3005,6 +3111,7 @@ steps:
timeout_in_minutes
:
50
mirror_hardwares
:
[
amdexperimental
]
agent_pool
:
mi355_2
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
2
source_file_dependencies
:
...
...
@@ -3026,6 +3133,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_2
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
2
source_file_dependencies
:
...
...
@@ -3063,6 +3171,7 @@ steps:
timeout_in_minutes
:
60
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_4
optional
:
true
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
4
source_file_dependencies
:
...
...
@@ -3079,6 +3188,7 @@ steps:
timeout_in_minutes
:
30
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_4
optional
:
true
num_gpus
:
4
source_file_dependencies
:
-
vllm/lora
...
...
@@ -3127,6 +3237,7 @@ steps:
-
label
:
NixlConnector PD accuracy tests (Distributed)
# 30min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_4
optional
:
true
timeout_in_minutes
:
30
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
4
...
...
@@ -3140,6 +3251,7 @@ steps:
-
label
:
DP EP NixlConnector PD accuracy tests (Distributed)
# 15min
mirror_hardwares
:
[
amdexperimental
,
amdproduction
]
agent_pool
:
mi355_4
optional
:
true
timeout_in_minutes
:
15
working_dir
:
"
/vllm-workspace/tests"
num_gpus
:
4
...
...
@@ -3278,6 +3390,7 @@ steps:
-
label
:
ROCm LM Eval Large Models (8 Card)
mirror_hardwares
:
[
amdproduction
]
agent_pool
:
mi355_8
optional
:
true
num_gpus
:
8
working_dir
:
"
/vllm-workspace/.buildkite/lm-eval-harness"
commands
:
...
...
.buildkite/test_areas/basic_correctness.yaml
View file @
81939e77
...
...
@@ -14,8 +14,3 @@ steps:
-
pytest -v -s basic_correctness/test_cumem.py
-
pytest -v -s basic_correctness/test_basic_correctness.py
-
pytest -v -s basic_correctness/test_cpu_offload.py
mirror
:
amd
:
device
:
mi325_1
depends_on
:
-
image-build-amd
.buildkite/test_areas/entrypoints.yaml
View file @
81939e77
...
...
@@ -24,11 +24,6 @@ steps:
-
pytest -v -s entrypoints/llm --ignore=entrypoints/llm/test_generate.py --ignore=entrypoints/llm/test_collective_rpc.py
-
pytest -v -s entrypoints/llm/test_generate.py
# it needs a clean process
-
pytest -v -s entrypoints/offline_mode
# Needs to avoid interference with other tests
mirror
:
amd
:
device
:
mi325_1
depends_on
:
-
image-build-amd
-
label
:
Entrypoints Integration (API Server 1)
timeout_in_minutes
:
130
...
...
@@ -60,11 +55,6 @@ steps:
-
pytest -v -s entrypoints/instrumentator
-
PYTHONPATH=/vllm-workspace pytest -v -s entrypoints/rpc
-
pytest -v -s tool_use
mirror
:
amd
:
device
:
mi325_1
depends_on
:
-
image-build-amd
-
label
:
Entrypoints Integration (Pooling)
timeout_in_minutes
:
50
...
...
@@ -75,11 +65,6 @@ steps:
commands
:
-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
-
pytest -v -s entrypoints/pooling
mirror
:
amd
:
device
:
mi325_1
depends_on
:
-
image-build-amd
-
label
:
Entrypoints Integration (Responses API)
timeout_in_minutes
:
50
...
...
.buildkite/test_areas/misc.yaml
View file @
81939e77
...
...
@@ -88,11 +88,6 @@ steps:
-
python3 offline_inference/spec_decode.py --test --method eagle --num_spec_tokens 3 --dataset-name hf --dataset-path philschmid/mt-bench --num-prompts 80 --temp 0 --top-p 1.0 --top-k -1 --tp 1 --enable-chunked-prefill --max-model-len
2048
# https://github.com/vllm-project/vllm/pull/26682 uses slightly more memory in PyTorch 2.9+ causing this test to OOM in 1xL4 GPU
-
python3 offline_inference/spec_decode.py --test --method eagle3 --num_spec_tokens 3 --dataset-name hf --dataset-path philschmid/mt-bench --num-prompts 80 --temp 0 --top-p 1.0 --top-k -1 --tp 1 --enable-chunked-prefill --max-model-len
1536
mirror
:
amd
:
device
:
mi325_1
depends_on
:
-
image-build-amd
-
label
:
Metrics, Tracing (2 GPUs)
timeout_in_minutes
:
20
...
...
.buildkite/test_areas/plugins.yaml
View file @
81939e77
...
...
@@ -39,8 +39,3 @@ steps:
-
pytest -v -s entrypoints/openai/test_oot_registration.py
# it needs a clean process
-
pytest -v -s models/test_oot_registration.py
# it needs a clean process
-
pytest -v -s plugins/lora_resolvers
# unit tests for in-tree lora resolver plugins
mirror
:
amd
:
device
:
mi325_2
depends_on
:
-
image-build-amd
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment