Unverified commit 6e6da5e4, authored by Arthur, committed by GitHub
Browse files

[`LlamaTokenizer`] make unk_token_length a property (#25689)

make unk_token_length a property
parent b85b8806
......@@ -154,7 +154,10 @@ class LlamaTokenizer(PreTrainedTokenizer):
self.use_default_system_prompt = use_default_system_prompt
self.sp_model = self.get_spm_processor()
self.unk_token_length = len(self.sp_model.encode(str(self.unk_token)))
@property
def unk_token_length(self):
    """Length of the encoding of the unknown token.

    Calls ``self.sp_model.encode`` on ``str(self.unk_token)`` and returns
    the ``len`` of the result. The value is recomputed on every access
    instead of being stored once, so it always reflects the current
    ``self.sp_model`` and ``self.unk_token``.
    """
    # Look up the encoder first, then stringify the token, matching the
    # original expression's evaluation order.
    encode = self.sp_model.encode
    unk_text = str(self.unk_token)
    return len(encode(unk_text))
# Copied from transformers.models.t5.tokenization_t5.T5Tokenizer.get_spm_processor
def get_spm_processor(self):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment