"docs/vscode:/vscode.git/clone" did not exist on "28ef0165b91948a8ba9fabc8e993eb11f4c78a58"
Unverified commit c8423ca3, authored by Yineng Zhang, committed by GitHub
Browse files

ci: update timeout and retry (#1086)


Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com>
parent e205527c
...@@ -6,11 +6,13 @@ on: ...@@ -6,11 +6,13 @@ on:
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/accuracy-test.yml"
pull_request: pull_request:
branches: [ main ] branches: [ main ]
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/accuracy-test.yml"
workflow_dispatch: workflow_dispatch:
concurrency: concurrency:
...@@ -43,4 +45,4 @@ jobs: ...@@ -43,4 +45,4 @@ jobs:
run: | run: |
cd test/srt cd test/srt
python3 test_eval_accuracy_large.py python3 test_eval_accuracy_large.py
timeout-minutes: 20 timeout-minutes: 10
...@@ -6,11 +6,13 @@ on: ...@@ -6,11 +6,13 @@ on:
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/e2e-test.yml"
pull_request: pull_request:
branches: [ main ] branches: [ main ]
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/e2e-test.yml"
workflow_dispatch: workflow_dispatch:
concurrency: concurrency:
...@@ -39,13 +41,16 @@ jobs: ...@@ -39,13 +41,16 @@ jobs:
run: | run: |
cd test/srt cd test/srt
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default python3 -m unittest test_serving_throughput.TestServingThroughput.test_default
timeout-minutes: 10
- name: Benchmark Serving Throughput (w/o RadixAttention) - name: Benchmark Serving Throughput (w/o RadixAttention)
run: | run: |
cd test/srt cd test/srt
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_without_radix_cache python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_without_radix_cache
timeout-minutes: 10
- name: Benchmark Serving Throughput (w/ ChunkedPrefill) - name: Benchmark Serving Throughput (w/ ChunkedPrefill)
run: | run: |
cd test/srt cd test/srt
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_with_chunked_prefill python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_with_chunked_prefill
timeout-minutes: 10
...@@ -6,11 +6,13 @@ on: ...@@ -6,11 +6,13 @@ on:
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/moe-test.yml"
pull_request: pull_request:
branches: [ main ] branches: [ main ]
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/moe-test.yml"
workflow_dispatch: workflow_dispatch:
concurrency: concurrency:
...@@ -36,7 +38,12 @@ jobs: ...@@ -36,7 +38,12 @@ jobs:
pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/ --force-reinstall pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/ --force-reinstall
- name: Benchmark MOE Serving Throughput - name: Benchmark MOE Serving Throughput
run: | uses: nick-fields/retry@v3
with:
timeout_minutes: 15
max_attempts: 2
retry_on: error
command: |
cd test/srt cd test/srt
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default_without_radix_cache python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default_without_radix_cache
...@@ -6,11 +6,13 @@ on: ...@@ -6,11 +6,13 @@ on:
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/unit-test.yml"
pull_request: pull_request:
branches: [ main ] branches: [ main ]
paths: paths:
- "python/sglang/**" - "python/sglang/**"
- "test/**" - "test/**"
- ".github/workflows/unit-test.yml"
workflow_dispatch: workflow_dispatch:
concurrency: concurrency:
...@@ -41,8 +43,10 @@ jobs: ...@@ -41,8 +43,10 @@ jobs:
run: | run: |
cd test/srt cd test/srt
python3 run_suite.py --suite minimal python3 run_suite.py --suite minimal
timeout-minutes: 15
- name: Test Frontend Language - name: Test Frontend Language
run: | run: |
cd test/lang cd test/lang
python3 run_suite.py --suite minimal python3 run_suite.py --suite minimal
timeout-minutes: 10
...@@ -73,7 +73,7 @@ class TestServingThroughput(unittest.TestCase): ...@@ -73,7 +73,7 @@ class TestServingThroughput(unittest.TestCase):
if os.getenv("SGLANG_IS_IN_CI", "false") == "true": if os.getenv("SGLANG_IS_IN_CI", "false") == "true":
# A100 (PCIE) performance # A100 (PCIE) performance
assert res["output_throughput"] > 950 assert res["output_throughput"] > 930
def test_default_without_radix_cache(self): def test_default_without_radix_cache(self):
res = self.run_test( res = self.run_test(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment