Unverified commit 6790240c, authored by Lianmin Zheng and committed by GitHub
Browse files

Fix unit test order to balance the tasks in CI (#1665)

parent 061e5463
...@@ -76,7 +76,7 @@ jobs: ...@@ -76,7 +76,7 @@ jobs:
timeout-minutes: 20 timeout-minutes: 20
run: | run: |
cd test/srt cd test/srt
python3 run_suite.py --suite minimal --range-begin 5 --range-end 15 python3 run_suite.py --suite minimal --range-begin 5 --range-end 16
unit-test-backend-part-3: unit-test-backend-part-3:
if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request' if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
...@@ -96,7 +96,7 @@ jobs: ...@@ -96,7 +96,7 @@ jobs:
timeout-minutes: 20 timeout-minutes: 20
run: | run: |
cd test/srt cd test/srt
python3 run_suite.py --suite minimal --range-begin 15 python3 run_suite.py --suite minimal --range-begin 16
performance-test-1-gpu-part-1: performance-test-1-gpu-part-1:
if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request' if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
......
...@@ -421,6 +421,7 @@ class ScheduleBatch: ...@@ -421,6 +421,7 @@ class ScheduleBatch:
extend_lens: List[int] = None extend_lens: List[int] = None
extend_num_tokens: int = None extend_num_tokens: int = None
running_bs: int = None running_bs: int = None
decoding_reqs: List[Req] = None
# Stream # Stream
has_stream: bool = False has_stream: bool = False
......
...@@ -76,7 +76,9 @@ def run_eval(args): ...@@ -76,7 +76,9 @@ def run_eval(args):
def few_shot_gsm8k(s, question): def few_shot_gsm8k(s, question):
s += few_shot_examples + question s += few_shot_examples + question
s += sgl.gen( s += sgl.gen(
"answer", max_tokens=512, stop=["Question", "Assistant:", "<|separator|>"] "answer",
max_tokens=args.max_new_tokens,
stop=["Question", "Assistant:", "<|separator|>"],
) )
##################################### #####################################
...@@ -131,6 +133,7 @@ if __name__ == "__main__": ...@@ -131,6 +133,7 @@ if __name__ == "__main__":
parser.add_argument("--num-shots", type=int, default=5) parser.add_argument("--num-shots", type=int, default=5)
parser.add_argument("--data-path", type=str, default="test.jsonl") parser.add_argument("--data-path", type=str, default="test.jsonl")
parser.add_argument("--num-questions", type=int, default=200) parser.add_argument("--num-questions", type=int, default=200)
parser.add_argument("--max-new-tokens", type=int, default=512)
parser.add_argument("--parallel", type=int, default=128) parser.add_argument("--parallel", type=int, default=128)
parser.add_argument("--host", type=str, default="http://127.0.0.1") parser.add_argument("--host", type=str, default="http://127.0.0.1")
parser.add_argument("--port", type=int, default=30000) parser.add_argument("--port", type=int, default=30000)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment