Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
c6acbdd5
"vscode:/vscode.git/clone" did not exist on "439fac723a99b668d168f32e3c1265463687b9be"
Commit
c6acbdd5
authored
Sep 27, 2019
by
Julien Chaumond
Browse files
Close #1304
parent
df7cd9e4
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
0 deletions
+2
-0
transformers/tokenization_roberta.py
transformers/tokenization_roberta.py
+2
-0
No files found.
transformers/tokenization_roberta.py
View file @
c6acbdd5
...
@@ -81,6 +81,8 @@ class RobertaTokenizer(GPT2Tokenizer):
...
@@ -81,6 +81,8 @@ class RobertaTokenizer(GPT2Tokenizer):
bos_token
=
bos_token
,
eos_token
=
eos_token
,
unk_token
=
unk_token
,
bos_token
=
bos_token
,
eos_token
=
eos_token
,
unk_token
=
unk_token
,
sep_token
=
sep_token
,
cls_token
=
cls_token
,
pad_token
=
pad_token
,
sep_token
=
sep_token
,
cls_token
=
cls_token
,
pad_token
=
pad_token
,
mask_token
=
mask_token
,
**
kwargs
)
mask_token
=
mask_token
,
**
kwargs
)
self
.
max_len_single_sentence
=
self
.
max_len
-
2
# take into account special tokens
self
.
max_len_sentences_pair
=
self
.
max_len
-
4
# take into account special tokens
def
add_special_tokens_single_sequence
(
self
,
token_ids
):
def
add_special_tokens_single_sequence
(
self
,
token_ids
):
"""
"""
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment