Support single token decode for `CodeGenTokenizer` (#28628)

Convert `token_ids` to a plain Python object (via `to_py_obj`) in `.decode()` so that a single token id can be decoded.

Support single token decode for `CodeGenTokenizer` (#28628)
convert token id to list in .decode()
9a4521dd · cmathw · GitHub · 5b5e71dc · 9a4521dd
Unverified Commit 9a4521dd authored Jan 23, 2024 by cmathw Committed by GitHub Jan 23, 2024
Show whitespace changes
Inline Side-by-side

Showing with 4 additions and 1 deletion

src/transformers/models/codegen/tokenization_codegen.py src/transformers/models/codegen/tokenization_codegen.py +4 -1

No files found.
--- a/src/transformers/models/codegen/tokenization_codegen.py
+++ b/src/transformers/models/codegen/tokenization_codegen.py
@@ -23,7 +23,7 @@ from typing import TYPE_CHECKING, List, Optional, Tuple, Union
 import numpy as np
 import regex as re
-from ...utils import is_tf_available, is_torch_available, logging
+from ...utils import is_tf_available, is_torch_available, logging, to_py_obj
 if TYPE_CHECKING:
@@ -352,6 +352,9 @@ class CodeGenTokenizer(PreTrainedTokenizer):
        Returns:
            `str`: The decoded sentence.
        """
+        token_ids = to_py_obj(token_ids)
        decoded_text = super()._decode(
            token_ids=token_ids,
            skip_special_tokens=skip_special_tokens,