Decode documentation

7bddb45a · LysandreJik · b3cfd979 · 7bddb45a
Commit 7bddb45a authored Oct 04, 2019 by LysandreJik
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 0 deletions

transformers/tokenization_utils.py transformers/tokenization_utils.py +5 -0

No files found.
--- a/transformers/tokenization_utils.py
+++ b/transformers/tokenization_utils.py
@@ -912,6 +912,11 @@ class PreTrainedTokenizer(object):
        Converts a sequence of ids (integers) into a string, using the tokenizer and vocabulary
        with options to remove special tokens and clean up tokenization spaces.
        Similar to doing ``self.convert_tokens_to_string(self.convert_ids_to_tokens(token_ids))``.
+        Args:
+            token_ids: list of tokenized input ids. Can be obtained using the `encode` or `encode_plus` methods.
+            skip_special_tokens: if set to True, will remove special tokens.
+            clean_up_tokenization_spaces: if set to True, will clean up the tokenization spaces.
        """
        filtered_tokens = self.convert_ids_to_tokens(token_ids, skip_special_tokens=skip_special_tokens)