"docs/vscode:/vscode.git/clone" did not exist on "387bdf0ab98615c1c01fb370ccd9a250b8ac9285"
Unverified commit 83c9d525, authored by Wentao Ye, committed by GitHub
Browse files

[CI] Add batch invariant test: Block FP8 + small MOE (#37895)


Signed-off-by: yewentao256 <zhyanwentao@126.com>
parent 8f4824b6
......@@ -192,7 +192,7 @@ steps:
- pytest -v -s config
- label: Batch Invariance (H100)
timeout_in_minutes: 25
timeout_in_minutes: 30
device: h100
source_file_dependencies:
- vllm/v1/attention
......@@ -203,6 +203,8 @@ steps:
- pip install pytest-timeout pytest-forked
- pytest -v -s v1/determinism/test_batch_invariance.py
- pytest -v -s v1/determinism/test_rms_norm_batch_invariant.py
- VLLM_TEST_MODEL=deepseek-ai/DeepSeek-V2-Lite-Chat pytest -v -s v1/determinism/test_batch_invariance.py::test_v1_generation_is_deterministic_across_batch_sizes_with_needle[TRITON_MLA]
- VLLM_TEST_MODEL=Qwen/Qwen3-30B-A3B-Thinking-2507-FP8 pytest -v -s v1/determinism/test_batch_invariance.py::test_v1_generation_is_deterministic_across_batch_sizes_with_needle[FLASH_ATTN]
- label: Acceptance Length Test (Large Models) # optional
timeout_in_minutes: 25
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment