Unverified commit 0b8e871e, authored by Zhewen Li, committed by GitHub
Browse files

[CI/Build] Fix `test_defaults_with_usage_context` in AMD CI (#27926)


Signed-off-by: zhewenli <zhewenli@meta.com>
parent 5ee93a59
...@@ -53,10 +53,12 @@ def test_defaults_with_usage_context(): ...@@ -53,10 +53,12 @@ def test_defaults_with_usage_context():
vllm_config: VllmConfig = engine_args.create_engine_config(UsageContext.LLM_CLASS) vllm_config: VllmConfig = engine_args.create_engine_config(UsageContext.LLM_CLASS)
from vllm.platforms import current_platform from vllm.platforms import current_platform
from vllm.utils.mem_constants import GiB_bytes
device_memory = current_platform.get_device_total_memory()
device_name = current_platform.get_device_name().lower() device_name = current_platform.get_device_name().lower()
if "h100" in device_name or "h200" in device_name: if device_memory >= 70 * GiB_bytes and "a100" not in device_name:
# For H100 and H200, we use larger default values. # For GPUs like H100, H200, and MI300x with >= 70GB memory
default_llm_tokens = 16384 default_llm_tokens = 16384
default_server_tokens = 8192 default_server_tokens = 8192
default_max_num_seqs = 1024 default_max_num_seqs = 1024
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment