Commit 8a22165b authored by Chen Chen, committed by A. Unique TensorFlower
Browse files

Internal change

PiperOrigin-RevId: 304556292
parent 8bf2b3be
...@@ -184,9 +184,15 @@ def create_float_feature(values): ...@@ -184,9 +184,15 @@ def create_float_feature(values):
return feature return feature
def create_training_instances(input_files, tokenizer, max_seq_length, def create_training_instances(input_files,
dupe_factor, short_seq_prob, masked_lm_prob, tokenizer,
max_predictions_per_seq, rng, do_whole_word_mask): max_seq_length,
dupe_factor,
short_seq_prob,
masked_lm_prob,
max_predictions_per_seq,
rng,
do_whole_word_mask=False):
"""Create `TrainingInstance`s from raw text.""" """Create `TrainingInstance`s from raw text."""
all_documents = [[]] all_documents = [[]]
...@@ -232,7 +238,7 @@ def create_training_instances(input_files, tokenizer, max_seq_length, ...@@ -232,7 +238,7 @@ def create_training_instances(input_files, tokenizer, max_seq_length,
def create_instances_from_document( def create_instances_from_document(
all_documents, document_index, max_seq_length, short_seq_prob, all_documents, document_index, max_seq_length, short_seq_prob,
masked_lm_prob, max_predictions_per_seq, vocab_words, rng, masked_lm_prob, max_predictions_per_seq, vocab_words, rng,
do_whole_word_mask): do_whole_word_mask=False):
"""Creates `TrainingInstance`s for a single document.""" """Creates `TrainingInstance`s for a single document."""
document = all_documents[document_index] document = all_documents[document_index]
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment