Unverified Commit 443c7cf4 authored by youkaichao's avatar youkaichao Committed by GitHub
Browse files

[ci][distributed] fix flaky tests (#6806)

parent 1adddb14
"""
WARNING: This test runs in both single-node (4 GPUs) and multi-node
(2 nodes with 2 GPUs each) modes. If the test only uses 2 GPUs, it is
important to set the distributed backend to "mp" to avoid Ray scheduling
all workers on a node other than the head node, which can cause the test
to fail.
"""
import os import os
import pytest import pytest
...@@ -78,7 +85,7 @@ def test_pp_cudagraph(PP_SIZE, MODEL_NAME, ATTN_BACKEND): ...@@ -78,7 +85,7 @@ def test_pp_cudagraph(PP_SIZE, MODEL_NAME, ATTN_BACKEND):
"--pipeline-parallel-size", "--pipeline-parallel-size",
str(PP_SIZE), str(PP_SIZE),
"--distributed-executor-backend", "--distributed-executor-backend",
"ray", "mp",
] ]
os.environ["VLLM_ATTENTION_BACKEND"] = ATTN_BACKEND os.environ["VLLM_ATTENTION_BACKEND"] = ATTN_BACKEND
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment