Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
zhaoyu6
sglang
Commits
2cadd51d
"vscode:/vscode.git/clone" did not exist on "47a1d6a85df1602833eedeb8cd3fb618c5e30cea"
Unverified
Commit
2cadd51d
authored
Mar 08, 2025
by
Lianmin Zheng
Committed by
GitHub
Mar 08, 2025
Browse files
Test no vllm custom allreduce (#4210)
parent
4a893d14
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
6 additions
and
2 deletions
+6
-2
.github/workflows/pr-test.yml
.github/workflows/pr-test.yml
+2
-0
test/srt/test_bench_one_batch.py
test/srt/test_bench_one_batch.py
+4
-2
No files found.
.github/workflows/pr-test.yml
View file @
2cadd51d
...
@@ -269,6 +269,8 @@ jobs:
...
@@ -269,6 +269,8 @@ jobs:
cd test/srt
cd test/srt
python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
USE_VLLM_CUSTOM_ALLREDUCE=0 python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
-
name
:
Benchmark single latency + torch.compile (TP=2)
-
name
:
Benchmark single latency + torch.compile (TP=2)
timeout-minutes
:
10
timeout-minutes
:
10
run
:
|
run
:
|
...
...
test/srt/test_bench_one_batch.py
View file @
2cadd51d
...
@@ -11,7 +11,9 @@ from sglang.test.test_utils import (
...
@@ -11,7 +11,9 @@ from sglang.test.test_utils import (
class
TestBenchOneBatch
(
unittest
.
TestCase
):
class
TestBenchOneBatch
(
unittest
.
TestCase
):
def
test_bs1
(
self
):
def
test_bs1
(
self
):
output_throughput
=
run_bench_one_batch
(
DEFAULT_MODEL_NAME_FOR_TEST
,
[])
output_throughput
=
run_bench_one_batch
(
DEFAULT_MODEL_NAME_FOR_TEST
,
[
"--cuda-graph-max-bs"
,
"2"
]
)
if
is_in_ci
():
if
is_in_ci
():
write_github_step_summary
(
write_github_step_summary
(
...
@@ -22,7 +24,7 @@ class TestBenchOneBatch(unittest.TestCase):
...
@@ -22,7 +24,7 @@ class TestBenchOneBatch(unittest.TestCase):
def
test_moe_tp2_bs1
(
self
):
def
test_moe_tp2_bs1
(
self
):
output_throughput
=
run_bench_one_batch
(
output_throughput
=
run_bench_one_batch
(
DEFAULT_MOE_MODEL_NAME_FOR_TEST
,
[
"--tp"
,
"2"
]
DEFAULT_MOE_MODEL_NAME_FOR_TEST
,
[
"--tp"
,
"2"
,
"--cuda-graph-max-bs"
,
"2"
]
)
)
if
is_in_ci
():
if
is_in_ci
():
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment