Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
0cbddfb1
"tests/vscode:/vscode.git/clone" did not exist on "cb94ffb672b4ee6204fbfa44be540153acc26bb6"
Unverified
Commit
0cbddfb1
authored
May 24, 2021
by
Lysandre Debut
Committed by
GitHub
May 24, 2021
Browse files
Replace double occurrences as the last step (#11367)
parent
73fde1de
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
2 deletions
+2
-2
src/transformers/convert_slow_tokenizer.py
src/transformers/convert_slow_tokenizer.py
+2
-2
No files found.
src/transformers/convert_slow_tokenizer.py
View file @
0cbddfb1
...
...
@@ -453,7 +453,6 @@ class AlbertConverter(SpmConverter):
list_normalizers
=
[
normalizers
.
Replace
(
"``"
,
'"'
),
normalizers
.
Replace
(
"''"
,
'"'
),
normalizers
.
Replace
(
Regex
(
" {2,}"
),
" "
),
]
if
not
self
.
original_tokenizer
.
keep_accents
:
list_normalizers
.
append
(
normalizers
.
NFKD
())
...
...
@@ -463,6 +462,7 @@ class AlbertConverter(SpmConverter):
precompiled_charsmap
=
proto
.
normalizer_spec
.
precompiled_charsmap
list_normalizers
.
append
(
normalizers
.
Precompiled
(
precompiled_charsmap
))
list_normalizers
.
append
(
normalizers
.
Replace
(
Regex
(
" {2,}"
),
" "
))
return
normalizers
.
Sequence
(
list_normalizers
)
def
post_processor
(
self
):
...
...
@@ -641,7 +641,6 @@ class XLNetConverter(SpmConverter):
list_normalizers
=
[
normalizers
.
Replace
(
"``"
,
'"'
),
normalizers
.
Replace
(
"''"
,
'"'
),
normalizers
.
Replace
(
Regex
(
" {2,}"
),
" "
),
]
if
not
self
.
original_tokenizer
.
keep_accents
:
list_normalizers
.
append
(
normalizers
.
NFKD
())
...
...
@@ -651,6 +650,7 @@ class XLNetConverter(SpmConverter):
precompiled_charsmap
=
proto
.
normalizer_spec
.
precompiled_charsmap
list_normalizers
.
append
(
normalizers
.
Precompiled
(
precompiled_charsmap
))
list_normalizers
.
append
(
normalizers
.
Replace
(
Regex
(
" {2,}"
),
" "
))
return
normalizers
.
Sequence
(
list_normalizers
)
def
post_processor
(
self
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment