Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
dd650e0e
Unverified
Commit
dd650e0e
authored
Aug 08, 2025
by
Zilin Zhu
Committed by
GitHub
Aug 08, 2025
Browse files
[RL] fix skip_server_warmup and rl health_generate logic (#8757)
parent
a9471542
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
12 additions
and
1 deletion
+12
-1
python/sglang/srt/entrypoints/http_server.py
python/sglang/srt/entrypoints/http_server.py
+2
-0
python/sglang/srt/managers/scheduler.py
python/sglang/srt/managers/scheduler.py
+4
-1
python/sglang/srt/managers/scheduler_update_weights_mixin.py
python/sglang/srt/managers/scheduler_update_weights_mixin.py
+6
-0
No files found.
python/sglang/srt/entrypoints/http_server.py
View file @
dd650e0e
...
...
@@ -1172,6 +1172,8 @@ def _wait_and_warmup(
pipe_finish_writer
,
):
return
else
:
_global_state
.
tokenizer_manager
.
server_status
=
ServerStatus
.
Up
logger
.
info
(
"The server is fired up and ready to roll!"
)
...
...
python/sglang/srt/managers/scheduler.py
View file @
dd650e0e
...
...
@@ -473,6 +473,7 @@ class Scheduler(
self
.
memory_saver_adapter
=
TorchMemorySaverAdapter
.
create
(
enable
=
server_args
.
enable_memory_saver
)
self
.
offload_tags
=
set
()
self
.
init_profier
()
self
.
recv_skipper
=
SchedulerRecvSkipper
.
maybe_create
(
server_args
)
...
...
@@ -1040,7 +1041,9 @@ class Scheduler(
for
recv_req
in
recv_reqs
:
# If it is a health check generation request and there are running requests, ignore it.
if
is_health_check_generate_req
(
recv_req
)
and
(
self
.
chunked_req
is
not
None
or
not
self
.
running_batch
.
is_empty
()
self
.
chunked_req
is
not
None
or
not
self
.
running_batch
.
is_empty
()
or
len
(
self
.
offload_tags
)
>
0
):
self
.
return_health_check_ct
+=
1
continue
...
...
python/sglang/srt/managers/scheduler_update_weights_mixin.py
View file @
dd650e0e
...
...
@@ -78,6 +78,9 @@ class SchedulerUpdateWeightsMixin:
if
tags
is
None
or
len
(
tags
)
==
0
:
tags
=
[
GPU_MEMORY_TYPE_WEIGHTS
,
GPU_MEMORY_TYPE_KV_CACHE
]
for
tag
in
tags
:
self
.
offload_tags
.
add
(
tag
)
if
GPU_MEMORY_TYPE_KV_CACHE
in
tags
:
self
.
memory_saver_adapter
.
pause
(
GPU_MEMORY_TYPE_KV_CACHE
)
self
.
flush_cache
()
...
...
@@ -97,6 +100,9 @@ class SchedulerUpdateWeightsMixin:
if
tags
is
None
or
len
(
tags
)
==
0
:
tags
=
[
GPU_MEMORY_TYPE_WEIGHTS
,
GPU_MEMORY_TYPE_KV_CACHE
]
for
tag
in
tags
:
self
.
offload_tags
.
remove
(
tag
)
if
GPU_MEMORY_TYPE_WEIGHTS
in
tags
:
self
.
memory_saver_adapter
.
resume
(
GPU_MEMORY_TYPE_WEIGHTS
)
torch
.
distributed
.
barrier
(
self
.
tp_cpu_group
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment