Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
3e07196f
Unverified
Commit
3e07196f
authored
Oct 18, 2022
by
Arthur
Committed by
GitHub
Oct 18, 2022
Browse files
check decoder_inputs_embeds is None before shifting labels (#19671)
parent
d356b89f
Changes
21
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
20 additions
and
20 deletions
+20
-20
src/transformers/models/bart/modeling_tf_bart.py
src/transformers/models/bart/modeling_tf_bart.py
+1
-1
src/transformers/models/blenderbot/modeling_blenderbot.py
src/transformers/models/blenderbot/modeling_blenderbot.py
+1
-1
src/transformers/models/blenderbot/modeling_tf_blenderbot.py
src/transformers/models/blenderbot/modeling_tf_blenderbot.py
+1
-1
src/transformers/models/blenderbot_small/modeling_blenderbot_small.py
...mers/models/blenderbot_small/modeling_blenderbot_small.py
+1
-1
src/transformers/models/blenderbot_small/modeling_tf_blenderbot_small.py
...s/models/blenderbot_small/modeling_tf_blenderbot_small.py
+1
-1
src/transformers/models/led/modeling_led.py
src/transformers/models/led/modeling_led.py
+1
-1
src/transformers/models/led/modeling_tf_led.py
src/transformers/models/led/modeling_tf_led.py
+1
-1
src/transformers/models/marian/modeling_marian.py
src/transformers/models/marian/modeling_marian.py
+1
-1
src/transformers/models/marian/modeling_tf_marian.py
src/transformers/models/marian/modeling_tf_marian.py
+1
-1
src/transformers/models/mbart/modeling_mbart.py
src/transformers/models/mbart/modeling_mbart.py
+1
-1
src/transformers/models/mbart/modeling_tf_mbart.py
src/transformers/models/mbart/modeling_tf_mbart.py
+1
-1
src/transformers/models/pegasus/modeling_pegasus.py
src/transformers/models/pegasus/modeling_pegasus.py
+1
-1
src/transformers/models/pegasus/modeling_tf_pegasus.py
src/transformers/models/pegasus/modeling_tf_pegasus.py
+1
-1
src/transformers/models/pegasus_x/modeling_pegasus_x.py
src/transformers/models/pegasus_x/modeling_pegasus_x.py
+1
-1
src/transformers/models/plbart/modeling_plbart.py
src/transformers/models/plbart/modeling_plbart.py
+1
-1
src/transformers/models/speech_to_text/modeling_speech_to_text.py
...sformers/models/speech_to_text/modeling_speech_to_text.py
+1
-1
src/transformers/models/speech_to_text/modeling_tf_speech_to_text.py
...rmers/models/speech_to_text/modeling_tf_speech_to_text.py
+1
-1
src/transformers/models/whisper/modeling_tf_whisper.py
src/transformers/models/whisper/modeling_tf_whisper.py
+1
-1
src/transformers/models/whisper/modeling_whisper.py
src/transformers/models/whisper/modeling_whisper.py
+1
-1
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_tf_{{cookiecutter.lowercase_modelname}}.py
...ame}}/modeling_tf_{{cookiecutter.lowercase_modelname}}.py
+1
-1
No files found.
src/transformers/models/bart/modeling_tf_bart.py
View file @
3e07196f
...
@@ -1352,7 +1352,7 @@ class TFBartForConditionalGeneration(TFBartPretrainedModel, TFCausalLanguageMode
...
@@ -1352,7 +1352,7 @@ class TFBartForConditionalGeneration(TFBartPretrainedModel, TFCausalLanguageMode
labels
,
labels
,
)
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/blenderbot/modeling_blenderbot.py
View file @
3e07196f
...
@@ -1319,7 +1319,7 @@ class BlenderbotForConditionalGeneration(BlenderbotPreTrainedModel):
...
@@ -1319,7 +1319,7 @@ class BlenderbotForConditionalGeneration(BlenderbotPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/blenderbot/modeling_tf_blenderbot.py
View file @
3e07196f
...
@@ -1371,7 +1371,7 @@ class TFBlenderbotForConditionalGeneration(TFBlenderbotPreTrainedModel, TFCausal
...
@@ -1371,7 +1371,7 @@ class TFBlenderbotForConditionalGeneration(TFBlenderbotPreTrainedModel, TFCausal
labels
,
labels
,
)
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/blenderbot_small/modeling_blenderbot_small.py
View file @
3e07196f
...
@@ -1286,7 +1286,7 @@ class BlenderbotSmallForConditionalGeneration(BlenderbotSmallPreTrainedModel):
...
@@ -1286,7 +1286,7 @@ class BlenderbotSmallForConditionalGeneration(BlenderbotSmallPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/blenderbot_small/modeling_tf_blenderbot_small.py
View file @
3e07196f
...
@@ -1351,7 +1351,7 @@ class TFBlenderbotSmallForConditionalGeneration(TFBlenderbotSmallPreTrainedModel
...
@@ -1351,7 +1351,7 @@ class TFBlenderbotSmallForConditionalGeneration(TFBlenderbotSmallPreTrainedModel
labels
,
labels
,
)
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/led/modeling_led.py
View file @
3e07196f
...
@@ -2428,7 +2428,7 @@ class LEDForConditionalGeneration(LEDPreTrainedModel):
...
@@ -2428,7 +2428,7 @@ class LEDForConditionalGeneration(LEDPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/led/modeling_tf_led.py
View file @
3e07196f
...
@@ -2445,7 +2445,7 @@ class TFLEDForConditionalGeneration(TFLEDPreTrainedModel):
...
@@ -2445,7 +2445,7 @@ class TFLEDForConditionalGeneration(TFLEDPreTrainedModel):
if
labels
is
not
None
:
if
labels
is
not
None
:
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/marian/modeling_marian.py
View file @
3e07196f
...
@@ -1432,7 +1432,7 @@ class MarianMTModel(MarianPreTrainedModel):
...
@@ -1432,7 +1432,7 @@ class MarianMTModel(MarianPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/marian/modeling_tf_marian.py
View file @
3e07196f
...
@@ -1388,7 +1388,7 @@ class TFMarianMTModel(TFMarianPreTrainedModel, TFCausalLanguageModelingLoss):
...
@@ -1388,7 +1388,7 @@ class TFMarianMTModel(TFMarianPreTrainedModel, TFCausalLanguageModelingLoss):
labels
,
labels
,
)
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/mbart/modeling_mbart.py
View file @
3e07196f
...
@@ -1347,7 +1347,7 @@ class MBartForConditionalGeneration(MBartPreTrainedModel):
...
@@ -1347,7 +1347,7 @@ class MBartForConditionalGeneration(MBartPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
)
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
)
outputs
=
self
.
model
(
outputs
=
self
.
model
(
...
...
src/transformers/models/mbart/modeling_tf_mbart.py
View file @
3e07196f
...
@@ -1387,7 +1387,7 @@ class TFMBartForConditionalGeneration(TFMBartPreTrainedModel, TFCausalLanguageMo
...
@@ -1387,7 +1387,7 @@ class TFMBartForConditionalGeneration(TFMBartPreTrainedModel, TFCausalLanguageMo
labels
,
labels
,
)
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
)
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
)
outputs
=
self
.
model
(
outputs
=
self
.
model
(
...
...
src/transformers/models/pegasus/modeling_pegasus.py
View file @
3e07196f
...
@@ -1393,7 +1393,7 @@ class PegasusForConditionalGeneration(PegasusPreTrainedModel):
...
@@ -1393,7 +1393,7 @@ class PegasusForConditionalGeneration(PegasusPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/pegasus/modeling_tf_pegasus.py
View file @
3e07196f
...
@@ -1397,7 +1397,7 @@ class TFPegasusForConditionalGeneration(TFPegasusPreTrainedModel, TFCausalLangua
...
@@ -1397,7 +1397,7 @@ class TFPegasusForConditionalGeneration(TFPegasusPreTrainedModel, TFCausalLangua
labels
,
labels
,
)
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/pegasus_x/modeling_pegasus_x.py
View file @
3e07196f
...
@@ -1605,7 +1605,7 @@ class PegasusXForConditionalGeneration(PegasusXPreTrainedModel):
...
@@ -1605,7 +1605,7 @@ class PegasusXForConditionalGeneration(PegasusXPreTrainedModel):
if
use_cache
:
if
use_cache
:
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
logger
.
warning
(
"The `use_cache` argument is changed to `False` since `labels` is provided."
)
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/plbart/modeling_plbart.py
View file @
3e07196f
...
@@ -1314,7 +1314,7 @@ class PLBartForConditionalGeneration(PLBartPreTrainedModel):
...
@@ -1314,7 +1314,7 @@ class PLBartForConditionalGeneration(PLBartPreTrainedModel):
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
if
labels
is
not
None
:
if
labels
is
not
None
:
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
)
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
)
outputs
=
self
.
model
(
outputs
=
self
.
model
(
...
...
src/transformers/models/speech_to_text/modeling_speech_to_text.py
View file @
3e07196f
...
@@ -1341,7 +1341,7 @@ class Speech2TextForConditionalGeneration(Speech2TextPreTrainedModel):
...
@@ -1341,7 +1341,7 @@ class Speech2TextForConditionalGeneration(Speech2TextPreTrainedModel):
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
if
labels
is
not
None
:
if
labels
is
not
None
:
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/speech_to_text/modeling_tf_speech_to_text.py
View file @
3e07196f
...
@@ -1405,7 +1405,7 @@ class TFSpeech2TextForConditionalGeneration(TFSpeech2TextPreTrainedModel, TFCaus
...
@@ -1405,7 +1405,7 @@ class TFSpeech2TextForConditionalGeneration(TFSpeech2TextPreTrainedModel, TFCaus
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
if
labels
is
not
None
:
if
labels
is
not
None
:
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/whisper/modeling_tf_whisper.py
View file @
3e07196f
...
@@ -1293,7 +1293,7 @@ class TFWhisperForConditionalGeneration(TFWhisperPreTrainedModel, TFCausalLangua
...
@@ -1293,7 +1293,7 @@ class TFWhisperForConditionalGeneration(TFWhisperPreTrainedModel, TFCausalLangua
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
if
labels
is
not
None
:
if
labels
is
not
None
:
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
src/transformers/models/whisper/modeling_whisper.py
View file @
3e07196f
...
@@ -1183,7 +1183,7 @@ class WhisperForConditionalGeneration(WhisperPreTrainedModel):
...
@@ -1183,7 +1183,7 @@ class WhisperForConditionalGeneration(WhisperPreTrainedModel):
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
return_dict
=
return_dict
if
return_dict
is
not
None
else
self
.
config
.
use_return_dict
if
labels
is
not
None
:
if
labels
is
not
None
:
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_tf_{{cookiecutter.lowercase_modelname}}.py
View file @
3e07196f
...
@@ -2938,7 +2938,7 @@ class TF{{cookiecutter.camelcase_modelname}}ForConditionalGeneration(TF{{cookiec
...
@@ -2938,7 +2938,7 @@ class TF{{cookiecutter.camelcase_modelname}}ForConditionalGeneration(TF{{cookiec
if
labels
is
not
None
:
if
labels
is
not
None
:
use_cache
=
False
use_cache
=
False
if
decoder_input_ids
is
None
:
if
decoder_input_ids
is
None
and
decoder_inputs_embeds
is
None
:
decoder_input_ids
=
shift_tokens_right
(
decoder_input_ids
=
shift_tokens_right
(
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
labels
,
self
.
config
.
pad_token_id
,
self
.
config
.
decoder_start_token_id
)
)
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment