test_pipelines_text_generation.py 2.78 KB
Newer Older
Sylvain Gugger's avatar
Sylvain Gugger committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
# Copyright 2020 The HuggingFace Team. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

15
16
import unittest

17
from transformers import pipeline
18
from transformers.testing_utils import require_torch
19

20
21
22
23
24
25
26
27
from .test_pipelines_common import MonoInputPipelineCommonMixin


class TextGenerationPipelineTests(MonoInputPipelineCommonMixin, unittest.TestCase):
    pipeline_task = "text-generation"
    pipeline_running_kwargs = {"prefix": "This is "}
    small_models = ["sshleifer/tiny-ctrl"]  # Models tested without the @slow decorator
    large_models = []  # Models tested with the @slow decorator
28
29

    def test_simple_generation(self):
30
        text_generator = pipeline(task="text-generation", model=self.small_models[0])
31
32
        # text-generation is non-deterministic by nature, we can't fully test the output

33
        outputs = text_generator("This is a test")
34
35
36
37
38

        self.assertEqual(len(outputs), 1)
        self.assertEqual(list(outputs[0].keys()), ["generated_text"])
        self.assertEqual(type(outputs[0]["generated_text"]), str)

39
        outputs = text_generator(["This is a test", "This is a second test"])
40
41
42
43
44
        self.assertEqual(len(outputs[0]), 1)
        self.assertEqual(list(outputs[0][0].keys()), ["generated_text"])
        self.assertEqual(type(outputs[0][0]["generated_text"]), str)
        self.assertEqual(list(outputs[1][0].keys()), ["generated_text"])
        self.assertEqual(type(outputs[1][0]["generated_text"]), str)
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62

    @require_torch
    def test_generation_output_style(self):
        text_generator = pipeline(task="text-generation", model=self.small_models[0])
        # text-generation is non-deterministic by nature, we can't fully test the output

        outputs = text_generator("This is a test")
        self.assertIn("This is a test", outputs[0]["generated_text"])

        outputs = text_generator("This is a test", return_full_text=False)
        self.assertNotIn("This is a test", outputs[0]["generated_text"])

        text_generator = pipeline(task="text-generation", model=self.small_models[0], return_full_text=False)
        outputs = text_generator("This is a test")
        self.assertNotIn("This is a test", outputs[0]["generated_text"])

        outputs = text_generator("This is a test", return_full_text=True)
        self.assertIn("This is a test", outputs[0]["generated_text"])