Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
norm
vllm
Commits
3d1cfbfc
Unverified
Commit
3d1cfbfc
authored
Dec 16, 2023
by
Woosuk Kwon
Committed by
GitHub
Dec 16, 2023
Browse files
[Minor] Delete Llama tokenizer warnings (#2146)
parent
37ca5581
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
0 additions
and
17 deletions
+0
-17
vllm/transformers_utils/tokenizer.py
vllm/transformers_utils/tokenizer.py
+0
-17
No files found.
vllm/transformers_utils/tokenizer.py
View file @
3d1cfbfc
...
@@ -8,9 +8,6 @@ from vllm.transformers_utils.tokenizers import *
...
@@ -8,9 +8,6 @@ from vllm.transformers_utils.tokenizers import *
logger
=
init_logger
(
__name__
)
logger
=
init_logger
(
__name__
)
# A fast LLaMA tokenizer with the pre-processed `tokenizer.json` file.
_FAST_LLAMA_TOKENIZER
=
"hf-internal-testing/llama-tokenizer"
def
get_tokenizer
(
def
get_tokenizer
(
tokenizer_name
:
str
,
tokenizer_name
:
str
,
...
@@ -27,13 +24,6 @@ def get_tokenizer(
...
@@ -27,13 +24,6 @@ def get_tokenizer(
"Cannot use the fast tokenizer in slow tokenizer mode."
)
"Cannot use the fast tokenizer in slow tokenizer mode."
)
kwargs
[
"use_fast"
]
=
False
kwargs
[
"use_fast"
]
=
False
if
(
"llama"
in
tokenizer_name
.
lower
()
and
kwargs
.
get
(
"use_fast"
,
True
)
and
tokenizer_name
!=
_FAST_LLAMA_TOKENIZER
):
logger
.
info
(
"For some LLaMA V1 models, initializing the fast tokenizer may "
"take a long time. To reduce the initialization time, consider "
f
"using '
{
_FAST_LLAMA_TOKENIZER
}
' instead of the original "
"tokenizer."
)
try
:
try
:
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer
=
AutoTokenizer
.
from_pretrained
(
tokenizer_name
,
tokenizer_name
,
...
@@ -41,13 +31,6 @@ def get_tokenizer(
...
@@ -41,13 +31,6 @@ def get_tokenizer(
trust_remote_code
=
trust_remote_code
,
trust_remote_code
=
trust_remote_code
,
tokenizer_revision
=
tokenizer_revision
,
tokenizer_revision
=
tokenizer_revision
,
**
kwargs
)
**
kwargs
)
except
TypeError
as
e
:
# The LLaMA tokenizer causes a protobuf error in some environments.
err_msg
=
(
"Failed to load the tokenizer. If you are using a LLaMA V1 model "
f
"consider using '
{
_FAST_LLAMA_TOKENIZER
}
' instead of the "
"original tokenizer."
)
raise
RuntimeError
(
err_msg
)
from
e
except
ValueError
as
e
:
except
ValueError
as
e
:
# If the error pertains to the tokenizer class not existing or not
# If the error pertains to the tokenizer class not existing or not
# currently being imported, suggest using the --trust-remote-code flag.
# currently being imported, suggest using the --trust-remote-code flag.
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment