test_ngram.py 3.07 KB
Newer Older
1
2
# SPDX-License-Identifier: Apache-2.0

3
import numpy as np
4

5
6
from vllm.v1.spec_decode.ngram_proposer import (NgramProposer,
                                                _find_subarray_kmp,
7
                                                _kmp_lps_array)
8
9


10
11
12
13
14
15
16
17
18
def test_kmp_lps_array():
    """Check ``_kmp_lps_array`` against hand-computed expected arrays.

    The cases cover an empty pattern, a single element, a run of identical
    values, all-distinct values, and a pattern whose prefix repeats before
    a mismatching final element.
    """
    # (input pattern, expected output) pairs, verified in this order.
    cases = (
        ([], []),
        ([1], [0]),
        ([1, 1, 1], [0, 1, 2]),
        ([1, 2, 3, 4], [0, 0, 0, 0]),
        ([1, 2, 1, 2, 3], [0, 0, 1, 2, 0]),
    )
    for pattern, expected_lps in cases:
        actual_lps = _kmp_lps_array(np.array(pattern))
        np.testing.assert_array_equal(actual_lps, np.array(expected_lps))
19
20


21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
def test_find_subarray_kmp():
    """Check ``_find_subarray_kmp`` on small hand-built token arrays.

    The helper is called positionally as ``_find_subarray_kmp(X, a, b)``.
    NOTE(review): judging by the expected values below, ``a`` looks like the
    length of the trailing n-gram to search for and ``b`` the number of
    tokens returned after the match -- confirm against the implementation.
    """
    # The trailing 2-gram [5, 6] does not occur earlier in the array.
    tokens = np.array([1, 2, 3, 4, 1, 2, 3, 5, 6])
    assert _find_subarray_kmp(tokens, 2, 2) is None

    # The array ends with a repeat of its own prefix [1, 2, 3].
    tokens = np.array([1, 2, 3, 4, 1, 2, 3])
    np.testing.assert_array_equal(_find_subarray_kmp(tokens, 2, 3),
                                  np.array([4, 1, 2]))
    np.testing.assert_array_equal(_find_subarray_kmp(tokens, 2, 2),
                                  np.array([4, 1]))
    np.testing.assert_array_equal(_find_subarray_kmp(tokens, 1, 3),
                                  np.array([4, 1, 2]))
    np.testing.assert_array_equal(_find_subarray_kmp(tokens, 1, 2),
                                  np.array([4, 1]))

    tokens = np.array([1, 3, 6, 2, 3, 4, 1, 2, 3])
    np.testing.assert_array_equal(_find_subarray_kmp(tokens, 2, 3),
                                  np.array([4, 1, 2]))
    # Return on the first match: the value 3 occurs at index 1 and again at
    # index 4, and the expected result follows the earlier occurrence.
    np.testing.assert_array_equal(_find_subarray_kmp(tokens, 1, 3),
                                  np.array([6, 2, 3]))
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88


def test_ngram_proposer():
    """Exercise ``NgramProposer.propose`` over several n-gram size ranges.

    One proposer instance is reused for every call, and each call asks for
    ``k=2``. The scenarios cover no match at all, a miss at the only allowed
    n-gram size, a fallback from 4-gram to 3-gram, and the cases where more
    than one n-gram size matches.
    """
    proposer = NgramProposer()

    def propose(tokens, min_n, max_n):
        # Every scenario differs only in the context and the n-gram bounds.
        return proposer.propose(
            context_token_ids=np.array(tokens),
            min_n=min_n,
            max_n=max_n,
            k=2,
        )

    # No match.
    outcome = propose([1, 2, 3, 4, 5], 2, 2)
    assert outcome is None

    # No match for 4-gram.
    outcome = propose([1, 2, 3, 4, 1, 2, 3], 4, 4)
    assert outcome is None

    # No match for 4-gram but match for 3-gram.
    outcome = propose([1, 2, 3, 4, 1, 2, 3], 3, 4)
    assert np.array_equal(outcome, np.array([4, 1]))

    # Match for both 4-gram and 3-gram.
    # In this case, the proposer should return the 4-gram match.
    outcome = propose([2, 3, 4, 5, 1, 2, 3, 4, 1, 2, 3, 4], 3, 4)
    assert np.array_equal(outcome, np.array([1, 2]))  # Not [5, 1]

    # Match for 2-gram and 3-gram, but not 4-gram.
    outcome = propose([3, 4, 5, 2, 3, 4, 1, 2, 3, 4], 2, 4)
    assert np.array_equal(outcome, np.array([1, 2]))  # Not [5, 2]