Fix docstring of train_new_from_iterator

a13c8145 · Omar Sanseviero · GitHub · 86a15472 · a13c8145
Unverified commit a13c8145, authored Aug 13, 2021 by Omar Sanseviero; committed by GitHub on Aug 13, 2021.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

src/transformers/tokenization_utils_fast.py src/transformers/tokenization_utils_fast.py +1 -1

No files found.
--- a/src/transformers/tokenization_utils_fast.py
+++ b/src/transformers/tokenization_utils_fast.py
@@ -587,7 +587,7 @@ class PreTrainedTokenizerFast(PreTrainedTokenizerBase):
            text_iterator (generator of :obj:`List[str]`):
                The training corpus. Should be a generator of batches of texts, for instance a list of lists of texts
                if you have everything in memory.
-            vocab_size (obj:`int`):
+            vocab_size (:obj:`int`):
                The size of the vocabulary you want for your tokenizer.
            new_special_tokens (list of :obj:`str` or :obj:`AddedToken`, `optional`):
                A list of new special tokens to add to the tokenizer you are training.