Fix memory pool leak error (#9271)

b3c1f2e4 · fzyzcjy · GitHub · be1a3cd9 · b3c1f2e4
Unverified commit b3c1f2e4, authored Aug 18, 2025 by fzyzcjy; committed by GitHub Aug 17, 2025
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 0 deletions

python/sglang/srt/mem_cache/allocator.py python/sglang/srt/mem_cache/allocator.py +5 -0

No files found.
--- a/python/sglang/srt/mem_cache/allocator.py
+++ b/python/sglang/srt/mem_cache/allocator.py
@@ -486,6 +486,11 @@ class PagedTokenToKVPoolAllocator(BaseTokenToKVPoolAllocator):
        ):
            self.merge_and_sort_free()
+        assert self.max_num_extend_tokens_next_power_of_2 >= extend_num_tokens, (
+            f"{self.max_num_extend_tokens_next_power_of_2=} >= {extend_num_tokens=} does not hold. "
+            f"If this happens in PD, consider letting chunked_prefill_size in D be as large as in P"
+        )
        out_indices = torch.empty(
            (extend_num_tokens,), dtype=torch.int64, device=self.device
        )