Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
b97cab7e
Unverified
Commit
b97cab7e
authored
Nov 13, 2023
by
Arthur
Committed by
GitHub
Nov 13, 2023
Browse files
Remove-auth-token (#27060)
* don't use `use_auth_token`internally * let's use token everywhere * fixup
parent
8f577dca
Changes
29
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
56 additions
and
58 deletions
+56
-58
docs/source/en/hpo_train.md
docs/source/en/hpo_train.md
+1
-1
docs/source/en/model_doc/nllb.md
docs/source/en/model_doc/nllb.md
+2
-2
docs/source/ja/hpo_train.md
docs/source/ja/hpo_train.md
+1
-1
docs/source/ko/hpo_train.md
docs/source/ko/hpo_train.md
+1
-1
examples/research_projects/jax-projects/README.md
examples/research_projects/jax-projects/README.md
+1
-1
examples/research_projects/layoutlmv3/run_funsd_cord.py
examples/research_projects/layoutlmv3/run_funsd_cord.py
+5
-5
examples/research_projects/mlm_wwm/run_mlm_wwm.py
examples/research_projects/mlm_wwm/run_mlm_wwm.py
+1
-1
examples/research_projects/quantization-qdqbert/run_quant_qa.py
...es/research_projects/quantization-qdqbert/run_quant_qa.py
+3
-3
examples/research_projects/robust-speech-event/eval.py
examples/research_projects/robust-speech-event/eval.py
+1
-1
examples/research_projects/robust-speech-event/run_speech_recognition_ctc_bnb.py
...cts/robust-speech-event/run_speech_recognition_ctc_bnb.py
+6
-6
examples/research_projects/robust-speech-event/run_speech_recognition_ctc_streaming.py
...bust-speech-event/run_speech_recognition_ctc_streaming.py
+6
-6
examples/research_projects/tapex/run_tabfact_with_tapex.py
examples/research_projects/tapex/run_tabfact_with_tapex.py
+3
-3
examples/research_projects/tapex/run_wikisql_with_tapex.py
examples/research_projects/tapex/run_wikisql_with_tapex.py
+3
-3
examples/research_projects/tapex/run_wikitablequestions_with_tapex.py
...earch_projects/tapex/run_wikitablequestions_with_tapex.py
+3
-3
examples/research_projects/xtreme-s/run_xtreme_s.py
examples/research_projects/xtreme-s/run_xtreme_s.py
+9
-9
src/transformers/generation/configuration_utils.py
src/transformers/generation/configuration_utils.py
+1
-1
src/transformers/integrations/peft.py
src/transformers/integrations/peft.py
+2
-2
src/transformers/models/bark/processing_bark.py
src/transformers/models/bark/processing_bark.py
+2
-2
src/transformers/tools/base.py
src/transformers/tools/base.py
+3
-3
tests/models/auto/test_processor_auto.py
tests/models/auto/test_processor_auto.py
+2
-4
No files found.
docs/source/en/hpo_train.md
View file @
b97cab7e
...
@@ -99,7 +99,7 @@ Define a `model_init` function and pass it to the [`Trainer`], as an example:
...
@@ -99,7 +99,7 @@ Define a `model_init` function and pass it to the [`Trainer`], as an example:
...
config
=
config
,
...
config
=
config
,
...
cache_dir
=
model_args
.
cache_dir
,
...
cache_dir
=
model_args
.
cache_dir
,
...
revision
=
model_args
.
model_revision
,
...
revision
=
model_args
.
model_revision
,
...
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
...
token
=
True
if
model_args
.
use_auth_token
else
None
,
...
)
...
)
```
```
...
...
docs/source/en/model_doc/nllb.md
View file @
b97cab7e
...
@@ -118,9 +118,9 @@ See example below for a translation from romanian to german:
...
@@ -118,9 +118,9 @@ See example below for a translation from romanian to german:
>>> from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
>>> from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
>>> tokenizer = AutoTokenizer.from_pretrained(
>>> tokenizer = AutoTokenizer.from_pretrained(
... "facebook/nllb-200-distilled-600M",
use_auth_
token=True, src_lang="ron_Latn"
... "facebook/nllb-200-distilled-600M", token=True, src_lang="ron_Latn"
... )
... )
>>> model = AutoModelForSeq2SeqLM.from_pretrained("facebook/nllb-200-distilled-600M",
use_auth_
token=True)
>>> model = AutoModelForSeq2SeqLM.from_pretrained("facebook/nllb-200-distilled-600M", token=True)
>>> article = "Şeful ONU spune că nu există o soluţie militară în Siria"
>>> article = "Şeful ONU spune că nu există o soluţie militară în Siria"
>>> inputs = tokenizer(article, return_tensors="pt")
>>> inputs = tokenizer(article, return_tensors="pt")
...
...
docs/source/ja/hpo_train.md
View file @
b97cab7e
...
@@ -105,7 +105,7 @@ Wandbについては、[object_parameter](https://docs.wandb.ai/guides/sweeps/co
...
@@ -105,7 +105,7 @@ Wandbについては、[object_parameter](https://docs.wandb.ai/guides/sweeps/co
...
config
=
config
,
...
config
=
config
,
...
cache_dir
=
model_args
.
cache_dir
,
...
cache_dir
=
model_args
.
cache_dir
,
...
revision
=
model_args
.
model_revision
,
...
revision
=
model_args
.
model_revision
,
...
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
...
token
=
True
if
model_args
.
use_auth_token
else
None
,
...
)
...
)
```
```
...
...
docs/source/ko/hpo_train.md
View file @
b97cab7e
...
@@ -87,7 +87,7 @@ wandb의 경우, 해당 [object_parameter](https://docs.wandb.ai/guides/sweeps/c
...
@@ -87,7 +87,7 @@ wandb의 경우, 해당 [object_parameter](https://docs.wandb.ai/guides/sweeps/c
...
config
=
config
,
...
config
=
config
,
...
cache_dir
=
model_args
.
cache_dir
,
...
cache_dir
=
model_args
.
cache_dir
,
...
revision
=
model_args
.
model_revision
,
...
revision
=
model_args
.
model_revision
,
...
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
...
token
=
True
if
model_args
.
use_auth_token
else
None
,
...
)
...
)
```
```
...
...
examples/research_projects/jax-projects/README.md
View file @
b97cab7e
...
@@ -1117,7 +1117,7 @@ params = model.init(key2, x)
...
@@ -1117,7 +1117,7 @@ params = model.init(key2, x)
bytes_output
=
serialization
.
to_bytes
(
params
)
bytes_output
=
serialization
.
to_bytes
(
params
)
repo
=
Repository
(
"flax-model"
,
clone_from
=
"flax-community/flax-model-dummy"
,
use_auth_
token
=
True
)
repo
=
Repository
(
"flax-model"
,
clone_from
=
"flax-community/flax-model-dummy"
,
token
=
True
)
with
repo
.
commit
(
"My cool Flax model :)"
):
with
repo
.
commit
(
"My cool Flax model :)"
):
with
open
(
"flax_model.msgpack"
,
"wb"
)
as
f
:
with
open
(
"flax_model.msgpack"
,
"wb"
)
as
f
:
f
.
write
(
bytes_output
)
f
.
write
(
bytes_output
)
...
...
examples/research_projects/layoutlmv3/run_funsd_cord.py
View file @
b97cab7e
...
@@ -250,7 +250,7 @@ def main():
...
@@ -250,7 +250,7 @@ def main():
"nielsr/funsd-layoutlmv3"
,
"nielsr/funsd-layoutlmv3"
,
data_args
.
dataset_config_name
,
data_args
.
dataset_config_name
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
elif
data_args
.
dataset_name
==
"cord"
:
elif
data_args
.
dataset_name
==
"cord"
:
# Downloading and loading a dataset from the hub.
# Downloading and loading a dataset from the hub.
...
@@ -258,7 +258,7 @@ def main():
...
@@ -258,7 +258,7 @@ def main():
"nielsr/cord-layoutlmv3"
,
"nielsr/cord-layoutlmv3"
,
data_args
.
dataset_config_name
,
data_args
.
dataset_config_name
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
else
:
else
:
raise
ValueError
(
"This script only supports either FUNSD or CORD out-of-the-box."
)
raise
ValueError
(
"This script only supports either FUNSD or CORD out-of-the-box."
)
...
@@ -313,7 +313,7 @@ def main():
...
@@ -313,7 +313,7 @@ def main():
finetuning_task
=
data_args
.
task_name
,
finetuning_task
=
data_args
.
task_name
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
processor
=
AutoProcessor
.
from_pretrained
(
processor
=
AutoProcessor
.
from_pretrained
(
...
@@ -321,7 +321,7 @@ def main():
...
@@ -321,7 +321,7 @@ def main():
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_fast
=
True
,
use_fast
=
True
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
add_prefix_space
=
True
,
add_prefix_space
=
True
,
apply_ocr
=
False
,
apply_ocr
=
False
,
)
)
...
@@ -332,7 +332,7 @@ def main():
...
@@ -332,7 +332,7 @@ def main():
config
=
config
,
config
=
config
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
# Set the correspondences label/ID inside the model config
# Set the correspondences label/ID inside the model config
...
...
examples/research_projects/mlm_wwm/run_mlm_wwm.py
View file @
b97cab7e
...
@@ -325,7 +325,7 @@ def main():
...
@@ -325,7 +325,7 @@ def main():
config
=
config
,
config
=
config
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
else
:
else
:
logger
.
info
(
"Training new model from scratch"
)
logger
.
info
(
"Training new model from scratch"
)
...
...
examples/research_projects/quantization-qdqbert/run_quant_qa.py
View file @
b97cab7e
...
@@ -322,14 +322,14 @@ def main():
...
@@ -322,14 +322,14 @@ def main():
model_args
.
config_name
if
model_args
.
config_name
else
model_args
.
model_name_or_path
,
model_args
.
config_name
if
model_args
.
config_name
else
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer
=
AutoTokenizer
.
from_pretrained
(
model_args
.
tokenizer_name
if
model_args
.
tokenizer_name
else
model_args
.
model_name_or_path
,
model_args
.
tokenizer_name
if
model_args
.
tokenizer_name
else
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_fast
=
True
,
use_fast
=
True
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
model
=
QDQBertForQuestionAnswering
.
from_pretrained
(
model
=
QDQBertForQuestionAnswering
.
from_pretrained
(
model_args
.
model_name_or_path
,
model_args
.
model_name_or_path
,
...
@@ -337,7 +337,7 @@ def main():
...
@@ -337,7 +337,7 @@ def main():
config
=
config
,
config
=
config
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
# Tokenizer check: this script requires a fast tokenizer.
# Tokenizer check: this script requires a fast tokenizer.
...
...
examples/research_projects/robust-speech-event/eval.py
View file @
b97cab7e
...
@@ -65,7 +65,7 @@ def normalize_text(text: str) -> str:
...
@@ -65,7 +65,7 @@ def normalize_text(text: str) -> str:
def
main
(
args
):
def
main
(
args
):
# load dataset
# load dataset
dataset
=
load_dataset
(
args
.
dataset
,
args
.
config
,
split
=
args
.
split
,
use_auth_
token
=
True
)
dataset
=
load_dataset
(
args
.
dataset
,
args
.
config
,
split
=
args
.
split
,
token
=
True
)
# for testing: only process the first two examples as a test
# for testing: only process the first two examples as a test
# dataset = dataset.select(range(10))
# dataset = dataset.select(range(10))
...
...
examples/research_projects/robust-speech-event/run_speech_recognition_ctc_bnb.py
View file @
b97cab7e
...
@@ -418,7 +418,7 @@ def main():
...
@@ -418,7 +418,7 @@ def main():
data_args
.
dataset_name
,
data_args
.
dataset_name
,
data_args
.
dataset_config_name
,
data_args
.
dataset_config_name
,
split
=
data_args
.
train_split_name
,
split
=
data_args
.
train_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
if
data_args
.
audio_column_name
not
in
raw_datasets
[
"train"
].
column_names
:
if
data_args
.
audio_column_name
not
in
raw_datasets
[
"train"
].
column_names
:
...
@@ -443,7 +443,7 @@ def main():
...
@@ -443,7 +443,7 @@ def main():
data_args
.
dataset_name
,
data_args
.
dataset_name
,
data_args
.
dataset_config_name
,
data_args
.
dataset_config_name
,
split
=
data_args
.
eval_split_name
,
split
=
data_args
.
eval_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
if
data_args
.
max_eval_samples
is
not
None
:
if
data_args
.
max_eval_samples
is
not
None
:
...
@@ -481,7 +481,7 @@ def main():
...
@@ -481,7 +481,7 @@ def main():
# the tokenizer
# the tokenizer
# load config
# load config
config
=
AutoConfig
.
from_pretrained
(
config
=
AutoConfig
.
from_pretrained
(
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
data_args
.
use_auth_token
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
token
=
data_args
.
use_auth_token
)
)
# 4. Next, if no tokenizer file is defined,
# 4. Next, if no tokenizer file is defined,
...
@@ -532,11 +532,11 @@ def main():
...
@@ -532,11 +532,11 @@ def main():
# load feature_extractor and tokenizer
# load feature_extractor and tokenizer
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer_name_or_path
,
tokenizer_name_or_path
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
**
tokenizer_kwargs
,
**
tokenizer_kwargs
,
)
)
feature_extractor
=
AutoFeatureExtractor
.
from_pretrained
(
feature_extractor
=
AutoFeatureExtractor
.
from_pretrained
(
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
data_args
.
use_auth_token
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
token
=
data_args
.
use_auth_token
)
)
# adapt config
# adapt config
...
@@ -564,7 +564,7 @@ def main():
...
@@ -564,7 +564,7 @@ def main():
model_args
.
model_name_or_path
,
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
config
=
config
,
config
=
config
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
# freeze encoder
# freeze encoder
...
...
examples/research_projects/robust-speech-event/run_speech_recognition_ctc_streaming.py
View file @
b97cab7e
...
@@ -395,7 +395,7 @@ def main():
...
@@ -395,7 +395,7 @@ def main():
# so we just need to set the correct target sampling rate and normalize the input
# so we just need to set the correct target sampling rate and normalize the input
# via the `feature_extractor`
# via the `feature_extractor`
feature_extractor
=
AutoFeatureExtractor
.
from_pretrained
(
feature_extractor
=
AutoFeatureExtractor
.
from_pretrained
(
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
data_args
.
use_auth_token
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
token
=
data_args
.
use_auth_token
)
)
if
training_args
.
do_train
:
if
training_args
.
do_train
:
...
@@ -403,7 +403,7 @@ def main():
...
@@ -403,7 +403,7 @@ def main():
path
=
data_args
.
dataset_name
,
path
=
data_args
.
dataset_name
,
name
=
data_args
.
dataset_config_name
,
name
=
data_args
.
dataset_config_name
,
split
=
data_args
.
train_split_name
,
split
=
data_args
.
train_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
streaming
=
True
,
streaming
=
True
,
sampling_rate
=
feature_extractor
.
sampling_rate
,
sampling_rate
=
feature_extractor
.
sampling_rate
,
)
)
...
@@ -431,7 +431,7 @@ def main():
...
@@ -431,7 +431,7 @@ def main():
path
=
data_args
.
dataset_name
,
path
=
data_args
.
dataset_name
,
name
=
data_args
.
dataset_config_name
,
name
=
data_args
.
dataset_config_name
,
split
=
data_args
.
eval_split_name
,
split
=
data_args
.
eval_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
streaming
=
True
,
streaming
=
True
,
sampling_rate
=
feature_extractor
.
sampling_rate
,
sampling_rate
=
feature_extractor
.
sampling_rate
,
)
)
...
@@ -465,7 +465,7 @@ def main():
...
@@ -465,7 +465,7 @@ def main():
# 3. Next, let's load the config as we might need it to create
# 3. Next, let's load the config as we might need it to create
# the tokenizer
# the tokenizer
config
=
AutoConfig
.
from_pretrained
(
config
=
AutoConfig
.
from_pretrained
(
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
data_args
.
use_auth_token
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
token
=
data_args
.
use_auth_token
)
)
# 4. Now we can instantiate the tokenizer and model
# 4. Now we can instantiate the tokenizer and model
...
@@ -481,7 +481,7 @@ def main():
...
@@ -481,7 +481,7 @@ def main():
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer_name_or_path
,
tokenizer_name_or_path
,
config
=
config
,
config
=
config
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
# adapt config
# adapt config
...
@@ -509,7 +509,7 @@ def main():
...
@@ -509,7 +509,7 @@ def main():
model_args
.
model_name_or_path
,
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
config
=
config
,
config
=
config
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
# freeze encoder
# freeze encoder
...
...
examples/research_projects/tapex/run_tabfact_with_tapex.py
View file @
b97cab7e
...
@@ -292,7 +292,7 @@ def main():
...
@@ -292,7 +292,7 @@ def main():
num_labels
=
num_labels
,
num_labels
=
num_labels
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
# load tapex tokenizer
# load tapex tokenizer
tokenizer
=
TapexTokenizer
.
from_pretrained
(
tokenizer
=
TapexTokenizer
.
from_pretrained
(
...
@@ -300,7 +300,7 @@ def main():
...
@@ -300,7 +300,7 @@ def main():
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_fast
=
model_args
.
use_fast_tokenizer
,
use_fast
=
model_args
.
use_fast_tokenizer
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
add_prefix_space
=
True
,
add_prefix_space
=
True
,
)
)
model
=
BartForSequenceClassification
.
from_pretrained
(
model
=
BartForSequenceClassification
.
from_pretrained
(
...
@@ -309,7 +309,7 @@ def main():
...
@@ -309,7 +309,7 @@ def main():
config
=
config
,
config
=
config
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
# Padding strategy
# Padding strategy
...
...
examples/research_projects/tapex/run_wikisql_with_tapex.py
View file @
b97cab7e
...
@@ -329,7 +329,7 @@ def main():
...
@@ -329,7 +329,7 @@ def main():
model_args
.
config_name
if
model_args
.
config_name
else
model_args
.
model_name_or_path
,
model_args
.
config_name
if
model_args
.
config_name
else
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
...
@@ -344,7 +344,7 @@ def main():
...
@@ -344,7 +344,7 @@ def main():
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_fast
=
model_args
.
use_fast_tokenizer
,
use_fast
=
model_args
.
use_fast_tokenizer
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
add_prefix_space
=
True
,
add_prefix_space
=
True
,
)
)
...
@@ -355,7 +355,7 @@ def main():
...
@@ -355,7 +355,7 @@ def main():
config
=
config
,
config
=
config
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
if
model
.
config
.
decoder_start_token_id
is
None
:
if
model
.
config
.
decoder_start_token_id
is
None
:
...
...
examples/research_projects/tapex/run_wikitablequestions_with_tapex.py
View file @
b97cab7e
...
@@ -327,7 +327,7 @@ def main():
...
@@ -327,7 +327,7 @@ def main():
model_args
.
config_name
if
model_args
.
config_name
else
model_args
.
model_name_or_path
,
model_args
.
config_name
if
model_args
.
config_name
else
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
...
@@ -342,7 +342,7 @@ def main():
...
@@ -342,7 +342,7 @@ def main():
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
use_fast
=
model_args
.
use_fast_tokenizer
,
use_fast
=
model_args
.
use_fast_tokenizer
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
add_prefix_space
=
True
,
add_prefix_space
=
True
,
)
)
...
@@ -353,7 +353,7 @@ def main():
...
@@ -353,7 +353,7 @@ def main():
config
=
config
,
config
=
config
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
revision
=
model_args
.
model_revision
,
revision
=
model_args
.
model_revision
,
use_auth_
token
=
True
if
model_args
.
use_auth_token
else
None
,
token
=
True
if
model_args
.
use_auth_token
else
None
,
)
)
if
model
.
config
.
decoder_start_token_id
is
None
:
if
model
.
config
.
decoder_start_token_id
is
None
:
...
...
examples/research_projects/xtreme-s/run_xtreme_s.py
View file @
b97cab7e
...
@@ -502,7 +502,7 @@ def main():
...
@@ -502,7 +502,7 @@ def main():
data_args
.
dataset_name
,
data_args
.
dataset_name
,
config_name
,
config_name
,
split
=
data_args
.
train_split_name
,
split
=
data_args
.
train_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
)
)
...
@@ -528,7 +528,7 @@ def main():
...
@@ -528,7 +528,7 @@ def main():
data_args
.
dataset_name
,
data_args
.
dataset_name
,
config_name
,
config_name
,
split
=
data_args
.
eval_split_name
,
split
=
data_args
.
eval_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
)
)
...
@@ -540,7 +540,7 @@ def main():
...
@@ -540,7 +540,7 @@ def main():
data_args
.
dataset_name
,
data_args
.
dataset_name
,
config_name
,
config_name
,
split
=
data_args
.
predict_split_name
,
split
=
data_args
.
predict_split_name
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
)
)
...
@@ -595,7 +595,7 @@ def main():
...
@@ -595,7 +595,7 @@ def main():
# 3. Next, let's load the config as we might need it to create
# 3. Next, let's load the config as we might need it to create
# the tokenizer
# the tokenizer
config
=
AutoConfig
.
from_pretrained
(
config
=
AutoConfig
.
from_pretrained
(
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
data_args
.
use_auth_token
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
token
=
data_args
.
use_auth_token
)
)
if
is_text_target
:
if
is_text_target
:
...
@@ -651,11 +651,11 @@ def main():
...
@@ -651,11 +651,11 @@ def main():
if
is_text_target
:
if
is_text_target
:
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer_name_or_path
,
tokenizer_name_or_path
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
**
tokenizer_kwargs
,
**
tokenizer_kwargs
,
)
)
feature_extractor
=
AutoFeatureExtractor
.
from_pretrained
(
feature_extractor
=
AutoFeatureExtractor
.
from_pretrained
(
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
use_auth_
token
=
data_args
.
use_auth_token
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
token
=
data_args
.
use_auth_token
)
)
# adapt config
# adapt config
...
@@ -694,14 +694,14 @@ def main():
...
@@ -694,14 +694,14 @@ def main():
model_args
.
model_name_or_path
,
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
config
=
config
,
config
=
config
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
elif
config
.
is_encoder_decoder
:
elif
config
.
is_encoder_decoder
:
model
=
AutoModelForSpeechSeq2Seq
.
from_pretrained
(
model
=
AutoModelForSpeechSeq2Seq
.
from_pretrained
(
model_args
.
model_name_or_path
,
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
config
=
config
,
config
=
config
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
if
model
.
config
.
decoder_start_token_id
is
None
:
if
model
.
config
.
decoder_start_token_id
is
None
:
raise
ValueError
(
"Make sure that `config.decoder_start_token_id` is correctly defined"
)
raise
ValueError
(
"Make sure that `config.decoder_start_token_id` is correctly defined"
)
...
@@ -710,7 +710,7 @@ def main():
...
@@ -710,7 +710,7 @@ def main():
model_args
.
model_name_or_path
,
model_args
.
model_name_or_path
,
cache_dir
=
model_args
.
cache_dir
,
cache_dir
=
model_args
.
cache_dir
,
config
=
config
,
config
=
config
,
use_auth_
token
=
data_args
.
use_auth_token
,
token
=
data_args
.
use_auth_token
,
)
)
# freeze encoder
# freeze encoder
...
...
src/transformers/generation/configuration_utils.py
View file @
b97cab7e
...
@@ -716,7 +716,7 @@ class GenerationConfig(PushToHubMixin):
...
@@ -716,7 +716,7 @@ class GenerationConfig(PushToHubMixin):
proxies
=
proxies
,
proxies
=
proxies
,
resume_download
=
resume_download
,
resume_download
=
resume_download
,
local_files_only
=
local_files_only
,
local_files_only
=
local_files_only
,
use_auth_
token
=
token
,
token
=
token
,
user_agent
=
user_agent
,
user_agent
=
user_agent
,
revision
=
revision
,
revision
=
revision
,
subfolder
=
subfolder
,
subfolder
=
subfolder
,
...
...
src/transformers/integrations/peft.py
View file @
b97cab7e
...
@@ -179,7 +179,7 @@ class PeftAdapterMixin:
...
@@ -179,7 +179,7 @@ class PeftAdapterMixin:
peft_config
=
PeftConfig
.
from_pretrained
(
peft_config
=
PeftConfig
.
from_pretrained
(
peft_model_id
,
peft_model_id
,
use_auth_
token
=
token
,
token
=
token
,
**
adapter_kwargs
,
**
adapter_kwargs
,
)
)
...
@@ -190,7 +190,7 @@ class PeftAdapterMixin:
...
@@ -190,7 +190,7 @@ class PeftAdapterMixin:
self
.
_hf_peft_config_loaded
=
True
self
.
_hf_peft_config_loaded
=
True
if
peft_model_id
is
not
None
:
if
peft_model_id
is
not
None
:
adapter_state_dict
=
load_peft_weights
(
peft_model_id
,
use_auth_
token
=
token
,
**
adapter_kwargs
)
adapter_state_dict
=
load_peft_weights
(
peft_model_id
,
token
=
token
,
**
adapter_kwargs
)
# We need to pre-process the state dict to remove unneeded prefixes - for backward compatibility
# We need to pre-process the state dict to remove unneeded prefixes - for backward compatibility
processed_adapter_state_dict
=
{}
processed_adapter_state_dict
=
{}
...
...
src/transformers/models/bark/processing_bark.py
View file @
b97cab7e
...
@@ -94,7 +94,7 @@ class BarkProcessor(ProcessorMixin):
...
@@ -94,7 +94,7 @@ class BarkProcessor(ProcessorMixin):
proxies
=
kwargs
.
pop
(
"proxies"
,
None
),
proxies
=
kwargs
.
pop
(
"proxies"
,
None
),
resume_download
=
kwargs
.
pop
(
"resume_download"
,
False
),
resume_download
=
kwargs
.
pop
(
"resume_download"
,
False
),
local_files_only
=
kwargs
.
pop
(
"local_files_only"
,
False
),
local_files_only
=
kwargs
.
pop
(
"local_files_only"
,
False
),
use_auth_
token
=
kwargs
.
pop
(
"use_auth_token"
,
None
),
token
=
kwargs
.
pop
(
"use_auth_token"
,
None
),
revision
=
kwargs
.
pop
(
"revision"
,
None
),
revision
=
kwargs
.
pop
(
"revision"
,
None
),
)
)
if
speaker_embeddings_path
is
None
:
if
speaker_embeddings_path
is
None
:
...
@@ -190,7 +190,7 @@ class BarkProcessor(ProcessorMixin):
...
@@ -190,7 +190,7 @@ class BarkProcessor(ProcessorMixin):
proxies
=
kwargs
.
pop
(
"proxies"
,
None
),
proxies
=
kwargs
.
pop
(
"proxies"
,
None
),
resume_download
=
kwargs
.
pop
(
"resume_download"
,
False
),
resume_download
=
kwargs
.
pop
(
"resume_download"
,
False
),
local_files_only
=
kwargs
.
pop
(
"local_files_only"
,
False
),
local_files_only
=
kwargs
.
pop
(
"local_files_only"
,
False
),
use_auth_
token
=
kwargs
.
pop
(
"use_auth_token"
,
None
),
token
=
kwargs
.
pop
(
"use_auth_token"
,
None
),
revision
=
kwargs
.
pop
(
"revision"
,
None
),
revision
=
kwargs
.
pop
(
"revision"
,
None
),
)
)
if
path
is
None
:
if
path
is
None
:
...
...
src/transformers/tools/base.py
View file @
b97cab7e
...
@@ -226,7 +226,7 @@ class Tool:
...
@@ -226,7 +226,7 @@ class Tool:
resolved_config_file
=
cached_file
(
resolved_config_file
=
cached_file
(
repo_id
,
repo_id
,
TOOL_CONFIG_FILE
,
TOOL_CONFIG_FILE
,
use_auth_
token
=
token
,
token
=
token
,
**
hub_kwargs
,
**
hub_kwargs
,
_raise_exceptions_for_missing_entries
=
False
,
_raise_exceptions_for_missing_entries
=
False
,
_raise_exceptions_for_connection_errors
=
False
,
_raise_exceptions_for_connection_errors
=
False
,
...
@@ -236,7 +236,7 @@ class Tool:
...
@@ -236,7 +236,7 @@ class Tool:
resolved_config_file
=
cached_file
(
resolved_config_file
=
cached_file
(
repo_id
,
repo_id
,
CONFIG_NAME
,
CONFIG_NAME
,
use_auth_
token
=
token
,
token
=
token
,
**
hub_kwargs
,
**
hub_kwargs
,
_raise_exceptions_for_missing_entries
=
False
,
_raise_exceptions_for_missing_entries
=
False
,
_raise_exceptions_for_connection_errors
=
False
,
_raise_exceptions_for_connection_errors
=
False
,
...
@@ -259,7 +259,7 @@ class Tool:
...
@@ -259,7 +259,7 @@ class Tool:
custom_tool
=
config
custom_tool
=
config
tool_class
=
custom_tool
[
"tool_class"
]
tool_class
=
custom_tool
[
"tool_class"
]
tool_class
=
get_class_from_dynamic_module
(
tool_class
,
repo_id
,
use_auth_
token
=
token
,
**
hub_kwargs
)
tool_class
=
get_class_from_dynamic_module
(
tool_class
,
repo_id
,
token
=
token
,
**
hub_kwargs
)
if
len
(
tool_class
.
name
)
==
0
:
if
len
(
tool_class
.
name
)
==
0
:
tool_class
.
name
=
custom_tool
[
"name"
]
tool_class
.
name
=
custom_tool
[
"name"
]
...
...
tests/models/auto/test_processor_auto.py
View file @
b97cab7e
...
@@ -308,9 +308,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
...
@@ -308,9 +308,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
def
test_push_to_hub
(
self
):
def
test_push_to_hub
(
self
):
processor
=
Wav2Vec2Processor
.
from_pretrained
(
SAMPLE_PROCESSOR_CONFIG_DIR
)
processor
=
Wav2Vec2Processor
.
from_pretrained
(
SAMPLE_PROCESSOR_CONFIG_DIR
)
with
tempfile
.
TemporaryDirectory
()
as
tmp_dir
:
with
tempfile
.
TemporaryDirectory
()
as
tmp_dir
:
processor
.
save_pretrained
(
processor
.
save_pretrained
(
os
.
path
.
join
(
tmp_dir
,
"test-processor"
),
push_to_hub
=
True
,
token
=
self
.
_token
)
os
.
path
.
join
(
tmp_dir
,
"test-processor"
),
push_to_hub
=
True
,
use_auth_token
=
self
.
_token
)
new_processor
=
Wav2Vec2Processor
.
from_pretrained
(
f
"
{
USER
}
/test-processor"
)
new_processor
=
Wav2Vec2Processor
.
from_pretrained
(
f
"
{
USER
}
/test-processor"
)
for
k
,
v
in
processor
.
feature_extractor
.
__dict__
.
items
():
for
k
,
v
in
processor
.
feature_extractor
.
__dict__
.
items
():
...
@@ -324,7 +322,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
...
@@ -324,7 +322,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
processor
.
save_pretrained
(
processor
.
save_pretrained
(
os
.
path
.
join
(
tmp_dir
,
"test-processor-org"
),
os
.
path
.
join
(
tmp_dir
,
"test-processor-org"
),
push_to_hub
=
True
,
push_to_hub
=
True
,
use_auth_
token
=
self
.
_token
,
token
=
self
.
_token
,
organization
=
"valid_org"
,
organization
=
"valid_org"
,
)
)
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment