Fix classification script: enable dynamic padding with truncation (#9554)

Co-authored-by: Pavel Tarashkevich <Pavel.Tarashkievich@orange.com>

Fix classification script: enable dynamic padding with truncation (#9554)
Co-authored-by: Pavel Tarashkevich <Pavel.Tarashkievich@orange.com>
27d0e01d · Pavel Tarashkevich · GitHub · 245cdb46 · 27d0e01d
Commit 27d0e01d (unverified), authored Jan 13, 2021 by Pavel Tarashkevich; committed by GitHub on Jan 13, 2021.
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 3 deletions

examples/text-classification/run_glue.py +1 -3

No files found.
--- a/examples/text-classification/run_glue.py
+++ b/examples/text-classification/run_glue.py
@@ -283,11 +283,9 @@ def main():
    # Padding strategy
    if data_args.pad_to_max_length:
        padding = "max_length"
-        max_length = data_args.max_seq_length
    else:
        # We will pad later, dynamically at batch creation, to the max sequence length in each batch
        padding = False
-        max_length = None
    # Some models have set the order of the labels to use, so let's make sure we do use it.
    label_to_id = None
@@ -314,7 +312,7 @@ def main():
        args = (
            (examples[sentence1_key],) if sentence2_key is None else (examples[sentence1_key], examples[sentence2_key])
        )
-        result = tokenizer(*args, padding=padding, max_length=max_length, truncation=True)
+        result = tokenizer(*args, padding=padding, max_length=data_args.max_seq_length, truncation=True)
        # Map labels to IDs (not necessary for GLUE tasks)
        if label_to_id is not None and "label" in examples: