Fix benchmark crash when the input length is 1 (param s=1)

8655cfb0 · huangwb · 25e8c688 · 8655cfb0
Commit 8655cfb0 authored Apr 30, 2024 by huangwb
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 2 additions and 0 deletions

server/text_generation_server/models/flash_causal_lm.py server/text_generation_server/models/flash_causal_lm.py +2 -0

No files found.
--- a/server/text_generation_server/models/flash_causal_lm.py
+++ b/server/text_generation_server/models/flash_causal_lm.py
@@ -169,11 +169,13 @@ class FlashCausalLMBatch(Batch):
            requests_idx_mapping[r.id] = i
            tokenized_input = tokenized_input[-r.truncate :]
+            '''fix input s=1 crash bug
            if (
                tokenized_input[0] == tokenizer.bos_token_id
                and tokenized_input[1] == tokenizer.bos_token_id
            ):
                tokenized_input = tokenized_input[1:]
+            '''
            input_length = len(tokenized_input)
            input_lengths.append(input_length)