Fixing linting on main. (#2719)

9fde5666 · Nicolas Patry · GitHub · aadc9cb4 · 9fde5666
Unverified commit 9fde5666, authored Nov 04, 2024 by Nicolas Patry; committed by GitHub on Nov 04, 2024.
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 2 deletions

server/text_generation_server/models/flash_causal_lm.py (+4 -2)

No files found.
--- a/server/text_generation_server/models/flash_causal_lm.py
+++ b/server/text_generation_server/models/flash_causal_lm.py
@@ -1729,9 +1729,11 @@ class FlashCausalLM(Model):
            # Slots can be discontiguous when prefix caching is enabled, so we need to expand the slot_indices,
            # then update the slots with the additional indices to ensure we're grabbing the ones that have been
            # allocated
-            slot_indices = (batch.slot_indices.unsqueeze(-1).expand(B, new_length) + arange_int).view(-1)
+            slot_indices = (
+                batch.slot_indices.unsqueeze(-1).expand(B, new_length) + arange_int
+            ).view(-1)
            slots = batch.slots[slot_indices]
            input_lengths = (
                input_lengths.unsqueeze(-1).expand(B, new_length) + arange_int
            ).view(-1)