test_stopping_criteria.py 4.17 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# coding=utf-8
# Copyright 2020 The HuggingFace Team Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

16
17
18
19
20
21
import time
import unittest

from transformers import is_torch_available
from transformers.testing_utils import require_torch, torch_device

22
from ..test_modeling_common import ids_tensor
23
24
25
26
27


if is_torch_available():
    import torch

28
    from transformers.generation import (
29
        EosTokenCriteria,
30
        MaxLengthCriteria,
31
        MaxNewTokensCriteria,
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
        MaxTimeCriteria,
        StoppingCriteriaList,
        validate_stopping_criteria,
    )


@require_torch
class StoppingCriteriaTestCase(unittest.TestCase):
    """Tests for the generation stopping criteria and ``StoppingCriteriaList``.

    Every test feeds a dummy ``(input_ids, scores)`` pair built by ``_get_tensors`` into a
    criterion and checks the per-sequence result it returns.
    """

    def _get_tensors(self, length):
        """Build a dummy ``(input_ids, scores)`` pair for a batch of three sequences.

        Args:
            length: Size of the second dimension of both returned tensors.

        Returns:
            A tuple ``(input_ids, scores)``. ``input_ids`` is produced by ``ids_tensor`` for shape
            ``(3, length)`` and a vocabulary size of 250. ``scores`` is a float tensor of shape
            ``(3, length)`` on ``torch_device`` whose entries all equal ``1 / length``.
        """
        batch_size = 3
        vocab_size = 250

        input_ids = ids_tensor((batch_size, length), vocab_size)
        scores = torch.ones((batch_size, length), device=torch_device, dtype=torch.float) / length
        return input_ids, scores

    def test_list_criteria(self):
        """A list combining max-length and max-time criteria only reports done at length 10."""
        # The first tensors are built before the criteria are constructed, so their creation
        # happens before MaxTimeCriteria exists.
        # NOTE(review): presumably the 0.1 s budget starts at construction - confirm.
        input_ids, scores = self._get_tensors(5)

        criteria = StoppingCriteriaList(
            [
                MaxLengthCriteria(max_length=10),
                MaxTimeCriteria(max_time=0.1),
            ]
        )

        # Shorter than max_length: not every sequence may be reported as done.
        self.assertFalse(all(criteria(input_ids, scores)))

        input_ids, scores = self._get_tensors(9)
        self.assertFalse(all(criteria(input_ids, scores)))

        # At max_length every sequence is expected to be reported as done.
        input_ids, scores = self._get_tensors(10)
        self.assertTrue(all(criteria(input_ids, scores)))

    def test_max_length_criteria(self):
        """``MaxLengthCriteria(max_length=10)`` reports done at length 10 but not at 5 or 9."""
        criteria = MaxLengthCriteria(max_length=10)

        input_ids, scores = self._get_tensors(5)
        self.assertFalse(all(criteria(input_ids, scores)))

        input_ids, scores = self._get_tensors(9)
        self.assertFalse(all(criteria(input_ids, scores)))

        input_ids, scores = self._get_tensors(10)
        self.assertTrue(all(criteria(input_ids, scores)))

    def test_max_new_tokens_criteria(self):
        """``MaxNewTokensCriteria`` with start length 5 and 5 new tokens reports done at length 10."""
        criteria = MaxNewTokensCriteria(start_length=5, max_new_tokens=5)

        input_ids, scores = self._get_tensors(5)
        self.assertFalse(all(criteria(input_ids, scores)))

        input_ids, scores = self._get_tensors(9)
        self.assertFalse(all(criteria(input_ids, scores)))

        input_ids, scores = self._get_tensors(10)
        self.assertTrue(all(criteria(input_ids, scores)))

        # A list wrapping this criterion must expose a max_length of 10
        # (presumably start_length + max_new_tokens - verify against the library).
        criteria_list = StoppingCriteriaList([criteria])
        self.assertEqual(criteria_list.max_length, 10)

    def test_max_time_criteria(self):
        """``MaxTimeCriteria`` reports done only once its time budget has been exceeded."""
        input_ids, scores = self._get_tensors(5)

        # Freshly created criterion: checked immediately, so it must not report done yet.
        criteria = MaxTimeCriteria(max_time=0.1)
        self.assertFalse(all(criteria(input_ids, scores)))

        # Back-date the initial timestamp by 0.2 s, more than the 0.1 s budget.
        criteria = MaxTimeCriteria(max_time=0.1, initial_timestamp=time.time() - 0.2)
        self.assertTrue(all(criteria(input_ids, scores)))

    def test_eos_token_criteria(self):
        """``EosTokenCriteria`` flags exactly the sequences whose last token is the EOS id."""
        criteria = EosTokenCriteria(eos_token_id=0)

        # Every sequence ends with the EOS id.
        input_ids, scores = self._get_tensors(5)
        input_ids[:, -1] = 0
        self.assertTrue(all(criteria(input_ids, scores)))

        # Only the first two sequences end with the EOS id.
        input_ids, scores = self._get_tensors(5)
        input_ids[:2, -1] = 0
        input_ids[2, -1] = 1
        self.assertListEqual(criteria(input_ids, scores).tolist(), [True, True, False])

        # No sequence ends with the EOS id.
        input_ids, scores = self._get_tensors(5)
        input_ids[:, -1] = 1
        self.assertListEqual(criteria(input_ids, scores).tolist(), [False, False, False])

    def test_validate_stopping_criteria(self):
        """``validate_stopping_criteria`` warns on a max-length mismatch and fills an empty list."""
        # The criterion's max_length equals the value passed in; the call is only exercised here.
        validate_stopping_criteria(StoppingCriteriaList([MaxLengthCriteria(10)]), 10)

        # The criterion says 10 but 11 is passed in: a UserWarning is expected.
        with self.assertWarns(UserWarning):
            validate_stopping_criteria(StoppingCriteriaList([MaxLengthCriteria(10)]), 11)

        # Starting from an empty list, the returned list must hold exactly one criterion
        # (presumably a max-length criterion built from the second argument - verify).
        stopping_criteria = validate_stopping_criteria(StoppingCriteriaList(), 11)

        self.assertEqual(len(stopping_criteria), 1)