Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
e9eeedaf
Unverified
Commit
e9eeedaf
authored
Jul 10, 2024
by
yukionfire
Committed by
GitHub
Jul 10, 2024
Browse files
remove duplicate words in msg (#31876)
parent
97aa3e29
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
3 additions
and
3 deletions
+3
-3
examples/flax/language-modeling/run_bart_dlm_flax.py
examples/flax/language-modeling/run_bart_dlm_flax.py
+1
-1
examples/research_projects/codeparrot/scripts/arguments.py
examples/research_projects/codeparrot/scripts/arguments.py
+1
-1
src/transformers/models/whisper/convert_openai_to_hf.py
src/transformers/models/whisper/convert_openai_to_hf.py
+1
-1
No files found.
examples/flax/language-modeling/run_bart_dlm_flax.py
View file @
e9eeedaf
...
@@ -290,7 +290,7 @@ class FlaxDataCollatorForBartDenoisingLM:
...
@@ -290,7 +290,7 @@ class FlaxDataCollatorForBartDenoisingLM:
def
__post_init__
(
self
):
def
__post_init__
(
self
):
if
self
.
tokenizer
.
mask_token
is
None
or
self
.
tokenizer
.
eos_token
is
None
:
if
self
.
tokenizer
.
mask_token
is
None
or
self
.
tokenizer
.
eos_token
is
None
:
raise
ValueError
(
raise
ValueError
(
"This tokenizer does not have a mask token or eos token
token
which is necessary for denoising"
"This tokenizer does not have a mask token or eos token which is necessary for denoising"
" language modeling. "
" language modeling. "
)
)
...
...
examples/research_projects/codeparrot/scripts/arguments.py
View file @
e9eeedaf
...
@@ -132,7 +132,7 @@ class PreprocessingArguments:
...
@@ -132,7 +132,7 @@ class PreprocessingArguments:
default
=
"transformersbook/codeparrot"
,
metadata
=
{
"help"
:
"Folder or name of dataset to process."
}
default
=
"transformersbook/codeparrot"
,
metadata
=
{
"help"
:
"Folder or name of dataset to process."
}
)
)
output_dir
:
Optional
[
str
]
=
field
(
output_dir
:
Optional
[
str
]
=
field
(
default
=
"codeparrot-clean"
,
metadata
=
{
"help"
:
"Folder to save processed
processed
dataset."
}
default
=
"codeparrot-clean"
,
metadata
=
{
"help"
:
"Folder to save processed dataset."
}
)
)
samples_per_file
:
Optional
[
int
]
=
field
(
samples_per_file
:
Optional
[
int
]
=
field
(
default
=
100_000
,
metadata
=
{
"help"
:
"Number of files to save per JSON output file."
}
default
=
100_000
,
metadata
=
{
"help"
:
"Number of files to save per JSON output file."
}
...
...
src/transformers/models/whisper/convert_openai_to_hf.py
View file @
e9eeedaf
...
@@ -176,7 +176,7 @@ def _download(url: str, root: str) -> Any:
...
@@ -176,7 +176,7 @@ def _download(url: str, root: str) -> Any:
model_bytes
=
open
(
download_target
,
"rb"
).
read
()
model_bytes
=
open
(
download_target
,
"rb"
).
read
()
if
insecure_hashlib
.
sha256
(
model_bytes
).
hexdigest
()
!=
expected_sha256
:
if
insecure_hashlib
.
sha256
(
model_bytes
).
hexdigest
()
!=
expected_sha256
:
raise
RuntimeError
(
raise
RuntimeError
(
"Model has been downloaded but the SHA256 checksum does not
not
match. Please retry loading the model."
"Model has been downloaded but the SHA256 checksum does not match. Please retry loading the model."
)
)
return
torch
.
load
(
io
.
BytesIO
(
model_bytes
))
return
torch
.
load
(
io
.
BytesIO
(
model_bytes
))
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment