Unverified commit 2f192835, authored by youkaichao and committed by GitHub
Browse files

[Core] latency optimization (#3890)

parent 95baec82
@@ -328,7 +328,7 @@ class BlockSpaceManagerV1(BlockSpaceManager):
self,
seq: Sequence,
) -> bool:
- token_ids_len = len(seq.data.get_token_ids())
+ token_ids_len = seq.data.get_len()
return token_ids_len > 0 and token_ids_len % seq.block_size == 0
def _maybe_promote_last_block(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment