test_srt_backend.py 1.77 KB
Newer Older
1
2
3
4
5
"""
Usage:
python3 -m unittest test_srt_backend.TestSRTBackend.test_gen_min_new_tokens
"""

Lianmin Zheng's avatar
Lianmin Zheng committed
6
7
import unittest

Liangsheng Yin's avatar
Liangsheng Yin committed
8
import sglang as sgl
Lianmin Zheng's avatar
Lianmin Zheng committed
9
10
from sglang.test.test_programs import (
    test_decode_int,
11
    test_decode_json_regex,
12
    test_dtype_gen,
Lianmin Zheng's avatar
Lianmin Zheng committed
13
14
    test_expert_answer,
    test_few_shot_qa,
15
    test_gen_min_new_tokens,
16
    test_hellaswag_select,
Lianmin Zheng's avatar
Lianmin Zheng committed
17
18
19
20
21
22
23
    test_mt_bench,
    test_parallel_decoding,
    test_regex,
    test_select,
    test_stream,
    test_tool_use,
)
Ying Sheng's avatar
Ying Sheng committed
24
from sglang.test.test_utils import DEFAULT_MODEL_NAME_FOR_TEST
Lianmin Zheng's avatar
Lianmin Zheng committed
25
26
27
28
29


class TestSRTBackend(unittest.TestCase):
    """Run the shared sglang test programs with an ``sgl.Runtime`` backend.

    One runtime is created per test class in ``setUpClass`` from
    ``DEFAULT_MODEL_NAME_FOR_TEST``, registered through
    ``sgl.set_default_backend`` and shut down again in ``tearDownClass``.
    Each test method delegates to the identically named helper imported
    from ``sglang.test.test_programs``.
    """

    # Runtime shared by every test in this class; assigned in setUpClass.
    backend = None

    @classmethod
    def setUpClass(cls):
        """Create the runtime once and register it as the default backend."""
        cls.backend = sgl.Runtime(model_path=DEFAULT_MODEL_NAME_FOR_TEST)
        sgl.set_default_backend(cls.backend)

    @classmethod
    def tearDownClass(cls):
        """Shut down the runtime created in ``setUpClass``."""
        cls.backend.shutdown()

    # NOTE: the test methods below are documented with comments rather than
    # docstrings so that unittest's verbose output keeps showing the plain
    # method names.

    def test_few_shot_qa(self):
        # Delegates to the shared few-shot QA program.
        test_few_shot_qa()

    def test_mt_bench(self):
        # Delegates to the shared MT-bench program.
        test_mt_bench()

    def test_select(self):
        # The helper is called with check_answer=False; the reason is not
        # visible in this file (presumably the answer is model dependent).
        test_select(check_answer=False)

    def test_decode_int(self):
        # Delegates to the shared integer-decoding program.
        test_decode_int()

    def test_decode_json_regex(self):
        # Delegates to the shared regex-constrained JSON decoding program.
        test_decode_json_regex()

    def test_expert_answer(self):
        # Delegates to the shared expert-answer program.
        test_expert_answer()

    def test_tool_use(self):
        # Delegates to the shared tool-use program.
        test_tool_use()

    def test_parallel_decoding(self):
        # Delegates to the shared parallel-decoding program.
        test_parallel_decoding()

    def test_stream(self):
        # Delegates to the shared streaming program.
        test_stream()

    def test_regex(self):
        # Delegates to the shared regex program.
        test_regex()

    def test_dtype_gen(self):
        # Delegates to the shared dtype-constrained generation program.
        test_dtype_gen()

    def test_hellaswag_select(self):
        # Run twice to capture more bugs
        for _ in range(2):
            # The helper returns (accuracy, latency); only accuracy is checked.
            accuracy, _latency = test_hellaswag_select()
            self.assertGreater(accuracy, 0.70)

    def test_gen_min_new_tokens(self):
        # Delegates to the shared min-new-tokens generation program.
        test_gen_min_new_tokens()

Lianmin Zheng's avatar
Lianmin Zheng committed
81
82

# Allow running this file directly; unittest.main() discovers and runs the
# test cases defined in this module.
if __name__ == "__main__":
    unittest.main()