Add check for token_type_ids before tensorizing

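Fix an issue where `prepare_for_model()` raises a `KeyError` when `return_token_type_ids` is set to `False` and `return_tensors` is set to `"tf"` or `"pt"`: the tensor-conversion step accessed `encoded_inputs["token_type_ids"]` unconditionally, even though that key is absent in this case.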

Add check for token_type_ids before tensorizing
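Fix an issue where `prepare_for_model()` raises a `KeyError` when `return_token_type_ids` is set to `False` and `return_tensors` is set to `"tf"` or `"pt"`: the tensor-conversion step accessed `encoded_inputs["token_type_ids"]` unconditionally, even though that key is absent in this case.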
c76c3ceb · Aditya Bhargava · Lysandre Debut · eb59e9f7 · c76c3ceb
Commit c76c3ceb authored Jan 08, 2020 by Aditya Bhargava Committed by Lysandre Debut Jan 15, 2020
Show whitespace changes
Inline Side-by-side

Showing with 6 additions and 2 deletions

src/transformers/tokenization_utils.py src/transformers/tokenization_utils.py +6 -2

No files found.
--- a/src/transformers/tokenization_utils.py
+++ b/src/transformers/tokenization_utils.py
@@ -1194,6 +1194,8 @@ class PreTrainedTokenizer(object):
        # Prepare inputs as tensors if asked
        if return_tensors == "tf" and is_tf_available():
            encoded_inputs["input_ids"] = tf.constant([encoded_inputs["input_ids"]])
+            if "token_type_ids" in encoded_inputs:
                encoded_inputs["token_type_ids"] = tf.constant([encoded_inputs["token_type_ids"]])
            if "attention_mask" in encoded_inputs:
@@ -1201,6 +1203,8 @@ class PreTrainedTokenizer(object):
        elif return_tensors == "pt" and is_torch_available():
            encoded_inputs["input_ids"] = torch.tensor([encoded_inputs["input_ids"]])
+            if "token_type_ids" in encoded_inputs:
                encoded_inputs["token_type_ids"] = torch.tensor([encoded_inputs["token_type_ids"]])
            if "attention_mask" in encoded_inputs: