Unverified commit 8fcb6935, authored by Sylvain Gugger and committed by GitHub
Browse files

Fix DataCollatorForLanguageModeling (#8621)

parent f6fe41c9
......@@ -261,7 +261,7 @@ class DataCollatorForLanguageModeling:
batch["input_ids"], special_tokens_mask=special_tokens_mask
)
else:
- labels = batch["input_ids"]
+ labels = batch["input_ids"].clone()
if self.tokenizer.pad_token_id is not None:
labels[labels == self.tokenizer.pad_token_id] = -100
batch["labels"] = labels
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment