Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
15ddd843
"integration/llm_image_test.go" did not exist on "9adca7f71128c09759fd0bc0b9a146f4e79fe935"
Unverified
Commit
15ddd843
authored
Mar 26, 2025
by
fzyzcjy
Committed by
GitHub
Mar 25, 2025
Browse files
Add retry for flaky tests in CI (#4755)
parent
52029bd1
Changes
112
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
49 additions
and
30 deletions
+49
-30
test/srt/test_matched_stop.py
test/srt/test_matched_stop.py
+2
-1
test/srt/test_metrics.py
test/srt/test_metrics.py
+2
-1
test/srt/test_mla.py
test/srt/test_mla.py
+2
-1
test/srt/test_mla_deepseek_v3.py
test/srt/test_mla_deepseek_v3.py
+3
-2
test/srt/test_mla_flashinfer.py
test/srt/test_mla_flashinfer.py
+4
-3
test/srt/test_mla_fp8.py
test/srt/test_mla_fp8.py
+2
-1
test/srt/test_mla_int8_deepseek_v3.py
test/srt/test_mla_int8_deepseek_v3.py
+5
-4
test/srt/test_mla_tp.py
test/srt/test_mla_tp.py
+2
-1
test/srt/test_modelopt_fp8kvcache.py
test/srt/test_modelopt_fp8kvcache.py
+2
-1
test/srt/test_models_from_modelscope.py
test/srt/test_models_from_modelscope.py
+2
-1
test/srt/test_moe_deepep.py
test/srt/test_moe_deepep.py
+2
-1
test/srt/test_moe_ep.py
test/srt/test_moe_ep.py
+3
-2
test/srt/test_moe_eval_accuracy_large.py
test/srt/test_moe_eval_accuracy_large.py
+2
-1
test/srt/test_nightly_gsm8k_eval.py
test/srt/test_nightly_gsm8k_eval.py
+2
-1
test/srt/test_nightly_human_eval.py
test/srt/test_nightly_human_eval.py
+2
-1
test/srt/test_nightly_math_eval.py
test/srt/test_nightly_math_eval.py
+2
-1
test/srt/test_no_chunked_prefill.py
test/srt/test_no_chunked_prefill.py
+2
-1
test/srt/test_no_overlap_scheduler.py
test/srt/test_no_overlap_scheduler.py
+2
-2
test/srt/test_openai_server.py
test/srt/test_openai_server.py
+4
-3
test/srt/test_page_size.py
test/srt/test_page_size.py
+2
-1
No files found.
test/srt/test_matched_stop.py
View file @
15ddd843
...
...
@@ -7,6 +7,7 @@ from sglang.srt.utils import kill_process_tree
from
sglang.test.test_utils
import
(
DEFAULT_MODEL_NAME_FOR_TEST
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
...
...
@@ -18,7 +19,7 @@ The story should span multiple events, challenges, and character developments ov
"""
class
TestMatchedStop
(
unittest
.
TestCase
):
class
TestMatchedStop
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MODEL_NAME_FOR_TEST
...
...
test/srt/test_metrics.py
View file @
15ddd843
...
...
@@ -7,11 +7,12 @@ from sglang.test.test_utils import (
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestEnableMetrics
(
unittest
.
TestCase
):
class
TestEnableMetrics
(
Custom
TestCase
):
def
test_metrics_enabled
(
self
):
"""Test that metrics endpoint returns data when enabled"""
process
=
popen_launch_server
(
...
...
test/srt/test_mla.py
View file @
15ddd843
...
...
@@ -7,11 +7,12 @@ from sglang.test.test_utils import (
DEFAULT_MLA_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestMLA
(
unittest
.
TestCase
):
class
TestMLA
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MLA_MODEL_NAME_FOR_TEST
...
...
test/srt/test_mla_deepseek_v3.py
View file @
15ddd843
...
...
@@ -9,11 +9,12 @@ from sglang.test.few_shot_gsm8k import run_eval as run_eval_few_shot_gsm8k
from
sglang.test.test_utils
import
(
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestMLADeepseekV3
(
unittest
.
TestCase
):
class
TestMLADeepseekV3
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"lmsys/sglang-ci-dsv3-test"
...
...
@@ -48,7 +49,7 @@ class TestMLADeepseekV3(unittest.TestCase):
self
.
assertGreater
(
metrics
[
"accuracy"
],
0.62
)
class
TestDeepseekV3MTP
(
unittest
.
TestCase
):
class
TestDeepseekV3MTP
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"lmsys/sglang-ci-dsv3-test"
...
...
test/srt/test_mla_flashinfer.py
View file @
15ddd843
...
...
@@ -9,11 +9,12 @@ from sglang.test.few_shot_gsm8k import run_eval as run_eval_few_shot_gsm8k
from
sglang.test.test_utils
import
(
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestFlashinferMLA
(
unittest
.
TestCase
):
class
TestFlashinferMLA
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"lmsys/sglang-ci-dsv3-test"
...
...
@@ -55,7 +56,7 @@ class TestFlashinferMLA(unittest.TestCase):
self
.
assertGreater
(
metrics
[
"accuracy"
],
0.62
)
class
TestFlashinferMLANoRagged
(
unittest
.
TestCase
):
class
TestFlashinferMLANoRagged
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"lmsys/sglang-ci-dsv3-test"
...
...
@@ -99,7 +100,7 @@ class TestFlashinferMLANoRagged(unittest.TestCase):
self
.
assertGreater
(
metrics
[
"accuracy"
],
0.62
)
class
TestFlashinferMLAMTP
(
unittest
.
TestCase
):
class
TestFlashinferMLAMTP
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"lmsys/sglang-ci-dsv3-test"
...
...
test/srt/test_mla_fp8.py
View file @
15ddd843
...
...
@@ -7,11 +7,12 @@ from sglang.test.test_utils import (
DEFAULT_MLA_FP8_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestMLA
(
unittest
.
TestCase
):
class
TestMLA
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MLA_FP8_MODEL_NAME_FOR_TEST
...
...
test/srt/test_mla_int8_deepseek_v3.py
View file @
15ddd843
...
...
@@ -9,11 +9,12 @@ from sglang.test.few_shot_gsm8k import run_eval as run_eval_few_shot_gsm8k
from
sglang.test.test_utils
import
(
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestMLADeepseekV3ChannelInt8
(
unittest
.
TestCase
):
class
TestMLADeepseekV3ChannelInt8
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"sgl-project/sglang-ci-dsv3-channel-int8-test"
...
...
@@ -48,7 +49,7 @@ class TestMLADeepseekV3ChannelInt8(unittest.TestCase):
self
.
assertGreater
(
metrics
[
"accuracy"
],
0.62
)
class
TestDeepseekV3MTPChannelInt8
(
unittest
.
TestCase
):
class
TestDeepseekV3MTPChannelInt8
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"sgl-project/sglang-ci-dsv3-channel-int8-test"
...
...
@@ -109,7 +110,7 @@ class TestDeepseekV3MTPChannelInt8(unittest.TestCase):
self
.
assertGreater
(
avg_spec_accept_length
,
2.5
)
class
TestMLADeepseekV3BlockInt8
(
unittest
.
TestCase
):
class
TestMLADeepseekV3BlockInt8
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"sgl-project/sglang-ci-dsv3-block-int8-test"
...
...
@@ -144,7 +145,7 @@ class TestMLADeepseekV3BlockInt8(unittest.TestCase):
self
.
assertGreater
(
metrics
[
"accuracy"
],
0.62
)
class
TestDeepseekV3MTPBlockInt8
(
unittest
.
TestCase
):
class
TestDeepseekV3MTPBlockInt8
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"sgl-project/sglang-ci-dsv3-block-int8-test"
...
...
test/srt/test_mla_tp.py
View file @
15ddd843
...
...
@@ -8,11 +8,12 @@ from sglang.test.few_shot_gsm8k import run_eval as run_eval_few_shot_gsm8k
from
sglang.test.test_utils
import
(
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestDeepseekTP2
(
unittest
.
TestCase
):
class
TestDeepseekTP2
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
"lmsys/sglang-ci-dsv3-test"
...
...
test/srt/test_modelopt_fp8kvcache.py
View file @
15ddd843
...
...
@@ -6,9 +6,10 @@ from sglang.srt.layers.quantization.modelopt_quant import (
ModelOptFp8Config
,
ModelOptFp8KVCacheMethod
,
)
from
sglang.test.test_utils
import
CustomTestCase
class
TestModelOptFp8KVCacheMethod
(
unittest
.
TestCase
):
class
TestModelOptFp8KVCacheMethod
(
Custom
TestCase
):
def
test_kv_cache_method_initialization
(
self
):
"""Test that ModelOptFp8KVCacheMethod can be instantiated and
inherits from BaseKVCacheMethod."""
...
...
test/srt/test_models_from_modelscope.py
View file @
15ddd843
...
...
@@ -5,9 +5,10 @@ import unittest
from
unittest
import
mock
from
sglang.srt.utils
import
prepare_model_and_tokenizer
from
sglang.test.test_utils
import
CustomTestCase
class
TestDownloadFromModelScope
(
unittest
.
TestCase
):
class
TestDownloadFromModelScope
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
...
...
test/srt/test_moe_deepep.py
View file @
15ddd843
...
...
@@ -7,11 +7,12 @@ from sglang.test.test_utils import (
DEFAULT_MLA_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestDeepEPMoE
(
unittest
.
TestCase
):
class
TestDeepEPMoE
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MLA_MODEL_NAME_FOR_TEST
...
...
test/srt/test_moe_ep.py
View file @
15ddd843
...
...
@@ -7,11 +7,12 @@ from sglang.test.test_utils import (
DEFAULT_MLA_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestEpMoE
(
unittest
.
TestCase
):
class
TestEpMoE
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MLA_MODEL_NAME_FOR_TEST
...
...
@@ -59,7 +60,7 @@ class TestEpMoE(unittest.TestCase):
self
.
assertGreater
(
metrics
[
"score"
],
0.8
)
class
TestEpMoEFP8
(
unittest
.
TestCase
):
class
TestEpMoEFP8
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MLA_MODEL_NAME_FOR_TEST
...
...
test/srt/test_moe_eval_accuracy_large.py
View file @
15ddd843
...
...
@@ -12,13 +12,14 @@ from sglang.test.test_utils import (
DEFAULT_MOE_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
is_in_ci
,
popen_launch_server
,
write_github_step_summary
,
)
class
TestMoEEvalAccuracyLarge
(
unittest
.
TestCase
):
class
TestMoEEvalAccuracyLarge
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MOE_MODEL_NAME_FOR_TEST
...
...
test/srt/test_nightly_gsm8k_eval.py
View file @
15ddd843
...
...
@@ -15,6 +15,7 @@ from sglang.test.test_utils import (
DEFAULT_MODEL_NAME_FOR_NIGHTLY_EVAL_TP2
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
is_in_ci
,
popen_launch_server
,
write_github_step_summary
,
...
...
@@ -129,7 +130,7 @@ def check_model_scores(results):
raise
AssertionError
(
"
\n
"
.
join
(
failed_models
))
class
TestNightlyGsm8KEval
(
unittest
.
TestCase
):
class
TestNightlyGsm8KEval
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model_groups
=
[
...
...
test/srt/test_nightly_human_eval.py
View file @
15ddd843
...
...
@@ -14,11 +14,12 @@ from sglang.test.test_utils import (
DEFAULT_MODEL_NAME_FOR_NIGHTLY_EVAL_TP2
,
DEFAULT_MODEL_NAME_FOR_TEST
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
is_in_ci
,
)
class
TestNightlyHumanEval
(
unittest
.
TestCase
):
class
TestNightlyHumanEval
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
if
is_in_ci
():
...
...
test/srt/test_nightly_math_eval.py
View file @
15ddd843
...
...
@@ -7,11 +7,12 @@ from sglang.test.test_utils import (
DEFAULT_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestEvalAccuracyLarge
(
unittest
.
TestCase
):
class
TestEvalAccuracyLarge
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_MODEL_NAME_FOR_TEST
...
...
test/srt/test_no_chunked_prefill.py
View file @
15ddd843
...
...
@@ -2,12 +2,13 @@ import unittest
from
sglang.test.test_utils
import
(
DEFAULT_MODEL_NAME_FOR_TEST
,
CustomTestCase
,
run_bench_serving
,
run_mmlu_test
,
)
class
TestNoChunkedPrefill
(
unittest
.
TestCase
):
class
TestNoChunkedPrefill
(
Custom
TestCase
):
def
test_no_chunked_prefill
(
self
):
run_mmlu_test
(
...
...
test/srt/test_no_overlap_scheduler.py
View file @
15ddd843
...
...
@@ -6,10 +6,10 @@ python3 test_overlap_schedule.py
import
unittest
from
sglang.test.test_utils
import
run_mmlu_test
from
sglang.test.test_utils
import
CustomTestCase
,
run_mmlu_test
class
TestOverlapSchedule
(
unittest
.
TestCase
):
class
TestOverlapSchedule
(
Custom
TestCase
):
def
test_no_radix_attention_chunked_prefill
(
self
):
run_mmlu_test
(
disable_radix_cache
=
True
,
chunked_prefill_size
=
32
,
disable_overlap
=
True
...
...
test/srt/test_openai_server.py
View file @
15ddd843
...
...
@@ -18,11 +18,12 @@ from sglang.test.test_utils import (
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestOpenAIServer
(
unittest
.
TestCase
):
class
TestOpenAIServer
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
...
...
@@ -541,7 +542,7 @@ The SmartHome Mini is a compact smart home assistant available in black or white
# EBNF Test Class: TestOpenAIServerEBNF
# Launches the server with xgrammar, has only EBNF tests
# -------------------------------------------------------------------------
class
TestOpenAIServerEBNF
(
unittest
.
TestCase
):
class
TestOpenAIServerEBNF
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
...
...
@@ -624,7 +625,7 @@ class TestOpenAIServerEBNF(unittest.TestCase):
)
class
TestOpenAIEmbedding
(
unittest
.
TestCase
):
class
TestOpenAIEmbedding
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
cls
.
model
=
DEFAULT_SMALL_EMBEDDING_MODEL_NAME_FOR_TEST
...
...
test/srt/test_page_size.py
View file @
15ddd843
...
...
@@ -8,11 +8,12 @@ from sglang.test.test_utils import (
DEFAULT_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
popen_launch_server
,
)
class
TestPageSize
(
unittest
.
TestCase
):
class
TestPageSize
(
Custom
TestCase
):
@
classmethod
def
setUpClass
(
cls
):
os
.
environ
[
"SGLANG_DEBUG_MEMORY_POOL"
]
=
"1"
...
...
Prev
1
2
3
4
5
6
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment