Whisper: move tensor to CPU before converting to NumPy array at decode time (#31954)

a5c642fe · Joao Gante · GitHub · df1c248a · a5c642fe · a5c642fe
Unverified commit a5c642fe, authored Jul 14, 2024 by Joao Gante; committed by GitHub Jul 14, 2024
2 changed files
--- a/src/transformers/models/whisper/tokenization_whisper.py
+++ b/src/transformers/models/whisper/tokenization_whisper.py
@@ -872,8 +872,11 @@ class WhisperTokenizer(PreTrainedTokenizer):
    @staticmethod
    def _convert_to_list(token_ids):
        # convert type to ndarray if necessary
-        if "torch" in str(type(token_ids)) or "tensorflow" in str(type(token_ids)) and hasattr(token_ids, "numpy"):
+        if hasattr(token_ids, "numpy"):
-            token_ids = token_ids.numpy()
+            if "torch" in str(type(token_ids)):
+                token_ids = token_ids.cpu().numpy()
+            elif "tensorflow" in str(type(token_ids)):
+                token_ids = token_ids.numpy()
        # now the token ids are either a numpy array, or a list of lists
        if isinstance(token_ids, np.ndarray):
            token_ids = token_ids.tolist()

--- a/src/transformers/models/whisper/tokenization_whisper_fast.py
+++ b/src/transformers/models/whisper/tokenization_whisper_fast.py
@@ -605,8 +605,11 @@ class WhisperTokenizerFast(PreTrainedTokenizerFast):
    # Copied from transformers.models.whisper.tokenization_whisper.WhisperTokenizer._convert_to_list
    def _convert_to_list(token_ids):
        # convert type to ndarray if necessary
-        if "torch" in str(type(token_ids)) or "tensorflow" in str(type(token_ids)) and hasattr(token_ids, "numpy"):
+        if hasattr(token_ids, "numpy"):
-            token_ids = token_ids.numpy()
+            if "torch" in str(type(token_ids)):
+                token_ids = token_ids.cpu().numpy()
+            elif "tensorflow" in str(type(token_ids)):
+                token_ids = token_ids.numpy()
        # now the token ids are either a numpy array, or a list of lists
        if isinstance(token_ids, np.ndarray):
            token_ids = token_ids.tolist()