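Fix #1597: correct the CTRLTokenizer docstring (plain Byte-Pair-Encoding, not byte-level; drop the ``add_prefix_space`` requirement note)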

777faa8a · Lysandre · b8c9ea00 · 777faa8a
Commit 777faa8a authored Oct 22, 2019 by Lysandre
Hide whitespace changes
Inline Side-by-side

Showing with 1 addition and 5 deletions

transformers/tokenization_ctrl.py transformers/tokenization_ctrl.py +1 -5

No files found.
--- a/transformers/tokenization_ctrl.py
+++ b/transformers/tokenization_ctrl.py
@@ -63,11 +63,7 @@ def get_pairs(word):
 class CTRLTokenizer(PreTrainedTokenizer):
    """
    CTRL BPE tokenizer. Peculiarities:
-        - Byte-level Byte-Pair-Encoding
+        - Byte-Pair-Encoding
-        - Requires a space to start the input string => the encoding methods should be called with the
-          ``add_prefix_space`` flag set to ``True``.
-          Otherwise, this tokenizer ``encode`` and ``decode`` method will not conserve
-          the absence of a space at the beginning of a string: `tokenizer.decode(tokenizer.encode("Hello")) = " Hello"`
    """
    vocab_files_names = VOCAB_FILES_NAMES
    pretrained_vocab_files_map = PRETRAINED_VOCAB_FILES_MAP