"ppocr/git@developer.sourcefind.cn:wangsen/paddle_dbnet.git" did not exist on "5c4c418b7d7f55595a17e942d7b5027b2f93bb29"
Unverified commit c4158a63, authored by Patrick von Platen and committed by GitHub
Browse files

[Pipelines] Encode to max length of input not max length of tokenizer for batch input (#3857)

* remove max_length = tokenizer.max_length when encoding

* make style
parent 857ccdb2
...@@ -425,11 +425,7 @@ class Pipeline(_ScikitCompat): ...@@ -425,11 +425,7 @@ class Pipeline(_ScikitCompat):
# Parse arguments # Parse arguments
inputs = self._args_parser(*texts, **kwargs) inputs = self._args_parser(*texts, **kwargs)
inputs = self.tokenizer.batch_encode_plus( inputs = self.tokenizer.batch_encode_plus(
inputs, inputs, add_special_tokens=True, return_tensors=self.framework, pad_to_max_length=pad_to_max_length,
add_special_tokens=True,
return_tensors=self.framework,
max_length=self.tokenizer.max_len,
pad_to_max_length=pad_to_max_length,
) )
return inputs return inputs
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment