Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
3520f75f
"docs/vscode:/vscode.git/clone" did not exist on "62b3c9e06ab13a4b79f2f7e5a12133c52541e232"
Unverified
Commit
3520f75f
authored
Jul 29, 2024
by
Liangsheng Yin
Committed by
GitHub
Jul 29, 2024
Browse files
Remove inf value for chunked prefill size (#812)
parent
c8e9fed8
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
6 additions
and
5 deletions
+6
-5
python/sglang/srt/managers/controller/tp_worker.py
python/sglang/srt/managers/controller/tp_worker.py
+5
-2
python/sglang/srt/server_args.py
python/sglang/srt/server_args.py
+1
-3
No files found.
python/sglang/srt/managers/controller/tp_worker.py
View file @
3520f75f
...
...
@@ -442,8 +442,11 @@ class ModelTpServer:
                 else:
                     # Add this request to the running batch
                     if (
-                        new_batch_input_tokens + req.extend_input_len
-                        <= self.chunked_prefill_size
+                        self.chunked_prefill_size is None
+                        or (
+                            new_batch_input_tokens + req.extend_input_len
+                            <= self.chunked_prefill_size
+                        )
                         or (
                             req.return_logprob and req.normalized_prompt_logprob is None
                         )
...
...
python/sglang/srt/server_args.py
View file @
3520f75f
...
...
@@ -87,8 +87,6 @@ class ServerArgs:
     node_rank: Optional[int] = None
 
     def __post_init__(self):
-        if self.chunked_prefill_size is None:
-            self.chunked_prefill_size = 1 << 30
         if self.tokenizer_path is None:
             self.tokenizer_path = self.model_path
         if self.mem_fraction_static is None:
...
...
@@ -414,7 +412,7 @@ class ServerArgs:
         ), "multi-node data parallel is not supported"
         assert not (
-            self.chunked_prefill_size < (1 << 30) and self.disable_radix_cache
+            self.chunked_prefill_size is not None and self.disable_radix_cache
         ), "chunked prefill is not supported with radix cache disabled currently"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment