Unverified Commit 22e44ad5 authored by Micah Williamson, committed by GitHub
Browse files

[ROCm][CI] Fix Weight Loading With Multiple GPU Tests on ROCm (#28984)


Signed-off-by: Micah Williamson <micah.williamson@amd.com>
parent 88f5b19f
...@@ -1323,7 +1323,7 @@ steps: ...@@ -1323,7 +1323,7 @@ steps:
- vllm/ - vllm/
- tests/weight_loading - tests/weight_loading
commands: commands:
- bash weight_loading/run_model_weight_loading_test.sh -c weight_loading/models.txt - bash weight_loading/run_model_weight_loading_test.sh -c weight_loading/models-amd.txt
- label: Weight Loading Multiple GPU Test - Large Models # optional - label: Weight Loading Multiple GPU Test - Large Models # optional
mirror_hardwares: [amdexperimental] mirror_hardwares: [amdexperimental]
...@@ -1331,13 +1331,12 @@ steps: ...@@ -1331,13 +1331,12 @@ steps:
# grade: Blocking # grade: Blocking
working_dir: "/vllm-workspace/tests" working_dir: "/vllm-workspace/tests"
num_gpus: 2 num_gpus: 2
gpu: a100
optional: true optional: true
source_file_dependencies: source_file_dependencies:
- vllm/ - vllm/
- tests/weight_loading - tests/weight_loading
commands: commands:
- bash weight_loading/run_model_weight_loading_test.sh -c weight_loading/models-large.txt - bash weight_loading/run_model_weight_loading_test.sh -c weight_loading/models-large-amd.txt
- label: NixlConnector PD accuracy tests (Distributed) # 30min - label: NixlConnector PD accuracy tests (Distributed) # 30min
mirror_hardwares: [amdexperimental] mirror_hardwares: [amdexperimental]
......
fp8, amd/Meta-Llama-3.1-8B-Instruct-FP8-KV, main
None, amd/Llama-3.2-1B-Instruct-FP8-KV, main
fp8, amd/Mixtral-8x7B-Instruct-v0.1-FP8-KV, main
fp8, amd/Meta-Llama-3.1-70B-Instruct-FP8-KV, main
None, microsoft/phi-4, main
fp8, amd/Mixtral-8x22B-Instruct-v0.1-FP8-KV, main
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment