Unverified commit b3c1f2e4, authored by fzyzcjy and committed by GitHub
Browse files

Fix memory pool leak error (#9271)

parent be1a3cd9
...@@ -486,6 +486,11 @@ class PagedTokenToKVPoolAllocator(BaseTokenToKVPoolAllocator): ...@@ -486,6 +486,11 @@ class PagedTokenToKVPoolAllocator(BaseTokenToKVPoolAllocator):
): ):
self.merge_and_sort_free() self.merge_and_sort_free()
assert self.max_num_extend_tokens_next_power_of_2 >= extend_num_tokens, (
f"{self.max_num_extend_tokens_next_power_of_2=} >= {extend_num_tokens=} does not hold. "
f"If this happens in PD, consider letting chunked_prefill_size in D be as large as in P"
)
out_indices = torch.empty( out_indices = torch.empty(
(extend_num_tokens,), dtype=torch.int64, device=self.device (extend_num_tokens,), dtype=torch.int64, device=self.device
) )
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment