"""Run the shared sglang test programs against an ``sgl.Runtime`` backend."""

import unittest

import sglang as sgl
from sglang.test.test_programs import (
    test_decode_int,
    test_decode_json_regex,
    test_dtype_gen,
    test_expert_answer,
    test_few_shot_qa,
    test_gen_min_new_tokens,
    test_hellaswag_select,
    test_mt_bench,
    test_parallel_decoding,
    test_regex,
    test_select,
    test_stream,
    test_tool_use,
)
from sglang.test.test_utils import DEFAULT_MODEL_NAME_FOR_TEST


class TestSRTBackend(unittest.TestCase):
    """Run the shared sglang test programs against one ``sgl.Runtime``.

    The runtime is created once in ``setUpClass``, installed as the default
    sglang backend, and shut down in ``tearDownClass``. Each test method
    delegates to the same-named function imported from
    ``sglang.test.test_programs``.
    """

    # Runtime shared by every test in this class; assigned in setUpClass.
    backend = None

    @classmethod
    def setUpClass(cls):
        """Create the runtime and install it as the default sglang backend."""
        cls.backend = sgl.Runtime(model_path=DEFAULT_MODEL_NAME_FOR_TEST)
        sgl.set_default_backend(cls.backend)

    @classmethod
    def tearDownClass(cls):
        """Shut down the runtime created in ``setUpClass``."""
        cls.backend.shutdown()

    # NOTE: inside each method the bare name (e.g. ``test_few_shot_qa``)
    # resolves to the module-level import, not to the method itself.

    def test_few_shot_qa(self):
        test_few_shot_qa()

    def test_mt_bench(self):
        test_mt_bench()

    def test_select(self):
        test_select(check_answer=False)

    def test_decode_int(self):
        test_decode_int()

    def test_decode_json_regex(self):
        test_decode_json_regex()

    def test_expert_answer(self):
        test_expert_answer()

    def test_tool_use(self):
        test_tool_use()

    def test_parallel_decoding(self):
        test_parallel_decoding()

    def test_stream(self):
        test_stream()

    def test_regex(self):
        test_regex()

    def test_dtype_gen(self):
        test_dtype_gen()

    def test_hellaswag_select(self):
        """Require the hellaswag select accuracy to exceed 0.71 on two runs."""
        # Run twice to capture more bugs
        for _ in range(2):
            accuracy, _latency = test_hellaswag_select()
            # Use the TestCase assertion rather than a bare ``assert`` so the
            # check is not stripped when Python runs with -O.
            self.assertGreater(accuracy, 0.71, f"{accuracy=}")

    def test_gen_min_new_tokens(self):
        test_gen_min_new_tokens()

# Allow running this test module directly as a script.
if __name__ == "__main__":
    unittest.main()