"vscode:/vscode.git/clone" did not exist on "e61138be19cce30b1cf9e16dd8c35bbdbb86530d"
Unverified commit 3c4e0ee6, authored by Lianmin Zheng and committed by GitHub
Browse files

[CI] Tune threshold (#5787)

parent 9c088829
...@@ -82,10 +82,10 @@ suites = { ...@@ -82,10 +82,10 @@ suites = {
TestFile("test_triton_moe_channel_fp8_kernel.py", 25), TestFile("test_triton_moe_channel_fp8_kernel.py", 25),
], ],
"per-commit-2-gpu": [ "per-commit-2-gpu": [
TestFile("models/lora/test_lora_tp.py", 300), TestFile("models/lora/test_lora_tp.py", 150),
TestFile("test_data_parallelism.py", 90), TestFile("test_data_parallelism.py", 90),
TestFile("test_dp_attention.py", 90), TestFile("test_dp_attention.py", 150),
TestFile("test_mla_tp.py", 420), TestFile("test_mla_tp.py", 174),
TestFile("test_moe_ep.py", 220), TestFile("test_moe_ep.py", 220),
TestFile("test_patch_torch.py", 30), TestFile("test_patch_torch.py", 30),
TestFile("test_update_weights_from_distributed.py", 100), TestFile("test_update_weights_from_distributed.py", 100),
......
...@@ -51,7 +51,7 @@ class TestBenchOneBatch(CustomTestCase): ...@@ -51,7 +51,7 @@ class TestBenchOneBatch(CustomTestCase):
f"### test_torch_compile_tp2_bs1\n" f"### test_torch_compile_tp2_bs1\n"
f"output_throughput : {output_throughput:.2f} token/s\n" f"output_throughput : {output_throughput:.2f} token/s\n"
) )
self.assertGreater(output_throughput, 235) self.assertGreater(output_throughput, 225)
if __name__ == "__main__": if __name__ == "__main__":
......
...@@ -28,7 +28,7 @@ class TestTorchNativeAttnBackend(CustomTestCase): ...@@ -28,7 +28,7 @@ class TestTorchNativeAttnBackend(CustomTestCase):
if is_in_ci(): if is_in_ci():
# Torch native backend is expected to be slower # Torch native backend is expected to be slower
assert output_throughput > 50, f"{output_throughput=}" self.assertGreater(output_throughput, 40)
def test_mmlu(self): def test_mmlu(self):
model = DEFAULT_MODEL_NAME_FOR_TEST model = DEFAULT_MODEL_NAME_FOR_TEST
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment