Fix chunked prefill size validation for disabled state (#8973)

Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>

Fix chunked prefill size validation for disabled state (#8973)
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
3bffe112 · 633WHU · GitHub · 44426e54 · 3bffe112
Unverified Commit 3bffe112 authored Aug 12, 2025 by 633WHU Committed by GitHub Aug 11, 2025
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 3 deletions

python/sglang/srt/server_args.py python/sglang/srt/server_args.py +5 -3

No files found.
--- a/python/sglang/srt/server_args.py
+++ b/python/sglang/srt/server_args.py
@@ -1999,9 +1999,11 @@ class ServerArgs:
            ), "enable_mixed_chunk is required for speculative decoding"
        # Check chunked prefill
-        assert (
-            self.chunked_prefill_size % self.page_size == 0
-        ), "chunked_prefill_size must be divisible by page_size"
+        # Skip validation if chunked prefill is disabled (i.e., size <= 0).
+        if self.chunked_prefill_size > 0:
+            assert (
+                self.chunked_prefill_size % self.page_size == 0
+            ), "chunked_prefill_size must be divisible by page_size"
    def check_lora_server_args(self):
        assert self.max_loras_per_batch > 0, "max_loras_per_batch must be positive"