"src/diffusers/models/attention2d.py" did not exist on "d8287fcd1d94f33df55b54e2e1c140c2ab15b444"
Unverified Commit 17c36c55 authored by Lianmin Zheng's avatar Lianmin Zheng Committed by GitHub
Browse files

[CI] Disabled deepep tests temporarily because it takes too much time. (#6186)

parent 31d1f6e7
...@@ -89,6 +89,25 @@ jobs: ...@@ -89,6 +89,25 @@ jobs:
cd test/srt cd test/srt
python3 run_suite.py --suite per-commit-2-gpu python3 run_suite.py --suite per-commit-2-gpu
unittest-test-backend-8-gpu:
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
github.event.pull_request.draft == false
needs: [unit-test-frontend, unit-test-backend-1-gpu, unit-test-backend-2-gpu]
runs-on: 8-gpu-runner
steps:
- name: Checkout code
uses: actions/checkout@v4
- name: Install dependencies
run: |
bash scripts/ci_install_dependency.sh
- name: Run test
timeout-minutes: 20
run: |
cd test/srt
python3 run_suite.py --suite per-commit-8-gpu
performance-test-1-gpu-part-1: performance-test-1-gpu-part-1:
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
github.event.pull_request.draft == false github.event.pull_request.draft == false
...@@ -262,7 +281,7 @@ jobs: ...@@ -262,7 +281,7 @@ jobs:
- name: Install dependencies - name: Install dependencies
run: | run: |
bash scripts/ci_install_dependency_8_gpu.sh bash scripts/ci_install_dependency.sh
- name: Run test - name: Run test
timeout-minutes: 10 timeout-minutes: 10
...@@ -270,35 +289,12 @@ jobs: ...@@ -270,35 +289,12 @@ jobs:
cd test/srt cd test/srt
python3 -m unittest test_disaggregation.TestDisaggregationMooncake.test_gsm8k python3 -m unittest test_disaggregation.TestDisaggregationMooncake.test_gsm8k
large-scale-test-8-gpu:
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
github.event.pull_request.draft == false
needs: [
unit-test-frontend, unit-test-backend-1-gpu, unit-test-backend-2-gpu,
performance-test-1-gpu-part-1, performance-test-1-gpu-part-2, performance-test-2-gpu,
accuracy-test-1-gpu, accuracy-test-2-gpu,
]
runs-on: 8-gpu-runner
steps:
- name: Checkout code
uses: actions/checkout@v4
- name: Install dependencies
run: |
bash scripts/ci_install_dependency_8_gpu.sh
- name: Run test
timeout-minutes: 25
run: |
cd test/srt
python3 run_suite.py --suite per-commit-8-gpu
finish: finish:
if: always() if: always()
needs: [ needs: [
unit-test-frontend, unit-test-backend-1-gpu, unit-test-backend-2-gpu, unit-test-frontend, unit-test-backend-1-gpu, unit-test-backend-2-gpu, unittest-test-backend-8-gpu,
performance-test-1-gpu-part-1, performance-test-1-gpu-part-2, performance-test-2-gpu, performance-test-1-gpu-part-1, performance-test-1-gpu-part-2, performance-test-2-gpu,
accuracy-test-1-gpu, accuracy-test-2-gpu, large-scale-test-8-gpu, accuracy-test-1-gpu, accuracy-test-2-gpu,
] ]
runs-on: ubuntu-latest runs-on: ubuntu-latest
steps: steps:
......
...@@ -99,9 +99,11 @@ suites = { ...@@ -99,9 +99,11 @@ suites = {
TestFile("test_verl_engine.py", 64), TestFile("test_verl_engine.py", 64),
], ],
"per-commit-8-gpu": [ "per-commit-8-gpu": [
TestFile("test_deepep_intranode.py", 50), # Disabled deepep tests temporarily because it takes too much time.
TestFile("test_deepep_low_latency.py", 50), # TODO: re-enable them after reducing the test time with compilation cache and smaller models.
TestFile("test_moe_deepep_eval_accuracy_large.py", 250), # TestFile("test_deepep_intranode.py", 50),
# TestFile("test_deepep_low_latency.py", 50),
# TestFile("test_moe_deepep_eval_accuracy_large.py", 250),
TestFile("test_local_attn.py", 250), TestFile("test_local_attn.py", 250),
TestFile("test_full_deepseek_v3.py", 250), TestFile("test_full_deepseek_v3.py", 250),
TestFile("test_pp_single_node.py", 150), TestFile("test_pp_single_node.py", 150),
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment