Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
68f8b60d
"tutorials/vscode:/vscode.git/clone" did not exist on "2cf4bd0acf479d8d51347b6b524aebd3fdcc8d9f"
Unverified
Commit
68f8b60d
authored
Oct 07, 2024
by
Ke Bao
Committed by
GitHub
Oct 07, 2024
Browse files
Fix chunked prefill condition (#1594)
parent
6a5b352a
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
15 additions
and
1 deletion
+15
-1
python/sglang/srt/managers/schedule_policy.py
python/sglang/srt/managers/schedule_policy.py
+4
-1
test/srt/test_chunked_prefill.py
test/srt/test_chunked_prefill.py
+11
-0
No files found.
python/sglang/srt/managers/schedule_policy.py
View file @
68f8b60d
...
...
@@ -249,7 +249,10 @@ class PrefillAdder:
return
AddReqResult
.
NO_TOKEN
tokens_freed
+=
tokens_occupied
if
req
.
extend_input_len
<=
self
.
rem_chunk_tokens
:
if
(
self
.
rem_chunk_tokens
is
None
or
req
.
extend_input_len
<=
self
.
rem_chunk_tokens
):
self
.
can_run_list
.
append
(
req
)
self
.
_prefill_one_req
(
0
,
...
...
test/srt/test_chunked_prefill.py
View file @
68f8b60d
...
...
@@ -8,6 +8,7 @@ from sglang.test.test_utils import (
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
popen_launch_server
,
run_bench_serving
,
)
...
...
@@ -62,6 +63,16 @@ class TestChunkedPrefill(unittest.TestCase):
disable_radix_cache
=
False
,
enable_mixed_chunk
=
False
,
chunked_prefill_size
=-
1
)
def test_no_chunked_prefill_without_radix_cache(self):
    """Check that all prompts complete with radix cache off and chunk size -1.

    Calls ``run_bench_serving`` with 10 prompts at an unbounded request
    rate, passing ``--disable-radix-cache`` and ``--chunked-prefill-size -1``
    as extra server arguments, and asserts that the reported ``"completed"``
    count equals 10.
    """
    # NOTE(review): "-1" presumably disables chunked prefill, as the test
    # name suggests -- confirm against the server argument definition.
    server_flags = ["--disable-radix-cache", "--chunked-prefill-size", "-1"]

    bench_result = run_bench_serving(
        model=DEFAULT_MODEL_NAME_FOR_TEST,
        num_prompts=10,
        request_rate=float("inf"),
        other_server_args=server_flags,
    )

    completed = bench_result["completed"]
    assert completed == 10
# Run the unittest runner only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    unittest.main()
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment