test_srt_backend.py 1.58 KB
Newer Older
Lianmin Zheng's avatar
Lianmin Zheng committed
1
2
import unittest

Liangsheng Yin's avatar
Liangsheng Yin committed
3
import sglang as sgl
Lianmin Zheng's avatar
Lianmin Zheng committed
4
5
from sglang.test.test_programs import (
    test_decode_int,
6
    test_decode_json_regex,
7
    test_dtype_gen,
Lianmin Zheng's avatar
Lianmin Zheng committed
8
9
    test_expert_answer,
    test_few_shot_qa,
10
    test_hellaswag_select,
Lianmin Zheng's avatar
Lianmin Zheng committed
11
12
13
14
15
16
17
    test_mt_bench,
    test_parallel_decoding,
    test_regex,
    test_select,
    test_stream,
    test_tool_use,
)
Ying Sheng's avatar
Ying Sheng committed
18
from sglang.test.test_utils import DEFAULT_MODEL_NAME_FOR_TEST
Lianmin Zheng's avatar
Lianmin Zheng committed
19
20
21
22
23


class TestSRTBackend(unittest.TestCase):
    """Run the shared sglang test programs with an ``sgl.Runtime`` backend.

    A single runtime is created for the whole class in ``setUpClass`` and
    registered through ``sgl.set_default_backend``. Each test method then
    calls the same-named helper imported from ``sglang.test.test_programs``
    without passing a backend explicitly.
    """

    # Runtime shared by every test in this class; assigned in setUpClass.
    backend = None

    @classmethod
    def setUpClass(cls):
        """Create the runtime once and register it as the default backend."""
        cls.backend = sgl.Runtime(model_path=DEFAULT_MODEL_NAME_FOR_TEST)
        sgl.set_default_backend(cls.backend)

    @classmethod
    def tearDownClass(cls):
        """Shut down the runtime created in ``setUpClass``, if there is one."""
        if cls.backend is not None:
            cls.backend.shutdown()
            # Drop the reference so a repeated teardown cannot shut down twice.
            cls.backend = None

    def test_few_shot_qa(self):
        test_few_shot_qa()

    def test_mt_bench(self):
        test_mt_bench()

    def test_select(self):
        # Answer checking is explicitly disabled for this backend.
        test_select(check_answer=False)

    def test_decode_int(self):
        test_decode_int()

    def test_decode_json_regex(self):
        test_decode_json_regex()

    def test_expert_answer(self):
        test_expert_answer()

    def test_tool_use(self):
        test_tool_use()

    def test_parallel_decoding(self):
        test_parallel_decoding()

    def test_stream(self):
        test_stream()

    def test_regex(self):
        test_regex()

    def test_dtype_gen(self):
        test_dtype_gen()

    def test_hellaswag_select(self):
        # Run twice to capture more bugs
        for _ in range(2):
            # The helper returns (accuracy, latency); only accuracy is checked.
            accuracy, _latency = test_hellaswag_select()
            # assertGreater (unlike a bare assert) still runs under `python -O`.
            self.assertGreater(accuracy, 0.71, f"{accuracy=}")
71

Lianmin Zheng's avatar
Lianmin Zheng committed
72
73

if __name__ == "__main__":
    # Executed directly as a script: hand over to unittest's command-line runner.
    unittest.main()