Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
b050d928
Unverified
Commit
b050d928
authored
Jul 18, 2024
by
zhyncs
Committed by
GitHub
Jul 18, 2024
Browse files
fix: set ulimit -n 65535 (#647)
parent
6a4dc996
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
35 additions
and
5 deletions
+35
-5
python/sglang/srt/server.py
python/sglang/srt/server.py
+35
-5
No files found.
python/sglang/srt/server.py
View file @
b050d928
...
@@ -145,9 +145,35 @@ def _set_global_server_args(server_args: ServerArgs):
...
@@ -145,9 +145,35 @@ def _set_global_server_args(server_args: ServerArgs):
}
}
def
launch_server
(
server_args
:
ServerArgs
,
def
_set_ulimit
(
target_soft_limit
=
65535
):
model_overide_args
:
Optional
[
dict
]
=
None
,
import
resource
pipe_finish_writer
:
Optional
[
mp
.
connection
.
Connection
]
=
None
):
resource_type
=
resource
.
RLIMIT_NOFILE
current_soft
,
current_hard
=
resource
.
getrlimit
(
resource_type
)
if
current_soft
>=
target_soft_limit
:
logger
.
info
(
f
"Current limits are already sufficient: soft=
{
current_soft
}
, hard=
{
current_hard
}
"
)
else
:
try
:
resource
.
setrlimit
(
resource_type
,
(
target_soft_limit
,
current_hard
))
new_soft
,
new_hard
=
resource
.
getrlimit
(
resource_type
)
logger
.
info
(
f
"Successfully set new limits: soft=
{
new_soft
}
, hard=
{
new_hard
}
"
)
except
ValueError
as
e
:
logger
.
warn
(
f
"Failed to set new limits:
{
e
}
"
)
logger
.
info
(
f
"Limits remain unchanged: soft=
{
current_soft
}
, hard=
{
current_hard
}
"
)
def
launch_server
(
server_args
:
ServerArgs
,
model_overide_args
:
Optional
[
dict
]
=
None
,
pipe_finish_writer
:
Optional
[
mp
.
connection
.
Connection
]
=
None
,
):
"""Launch an HTTP server."""
"""Launch an HTTP server."""
global
tokenizer_manager
global
tokenizer_manager
...
@@ -160,6 +186,7 @@ def launch_server(server_args: ServerArgs,
...
@@ -160,6 +186,7 @@ def launch_server(server_args: ServerArgs,
os
.
environ
[
"TF_CPP_MIN_LOG_LEVEL"
]
=
"3"
os
.
environ
[
"TF_CPP_MIN_LOG_LEVEL"
]
=
"3"
os
.
environ
[
"NCCL_CUMEM_ENABLE"
]
=
"0"
os
.
environ
[
"NCCL_CUMEM_ENABLE"
]
=
"0"
os
.
environ
[
"NCCL_NVLS_ENABLE"
]
=
"0"
os
.
environ
[
"NCCL_NVLS_ENABLE"
]
=
"0"
_set_ulimit
()
if
server_args
.
show_time_cost
:
if
server_args
.
show_time_cost
:
enable_show_time_cost
()
enable_show_time_cost
()
if
server_args
.
disable_disk_cache
:
if
server_args
.
disable_disk_cache
:
...
@@ -248,7 +275,8 @@ def launch_server(server_args: ServerArgs,
...
@@ -248,7 +275,8 @@ def launch_server(server_args: ServerArgs,
proc_controller
.
kill
()
proc_controller
.
kill
()
proc_detoken
.
kill
()
proc_detoken
.
kill
()
print
(
print
(
f
"Initialization failed. controller_init_state:
{
controller_init_state
}
"
,
flush
=
True
f
"Initialization failed. controller_init_state:
{
controller_init_state
}
"
,
flush
=
True
,
)
)
print
(
print
(
f
"Initialization failed. detoken_init_state:
{
detoken_init_state
}
"
,
f
"Initialization failed. detoken_init_state:
{
detoken_init_state
}
"
,
...
@@ -261,7 +289,9 @@ def launch_server(server_args: ServerArgs,
...
@@ -261,7 +289,9 @@ def launch_server(server_args: ServerArgs,
app
.
add_middleware
(
APIKeyValidatorMiddleware
,
api_key
=
server_args
.
api_key
)
app
.
add_middleware
(
APIKeyValidatorMiddleware
,
api_key
=
server_args
.
api_key
)
# Send a warmup request
# Send a warmup request
t
=
threading
.
Thread
(
target
=
_wait_and_warmup
,
args
=
(
server_args
,
pipe_finish_writer
))
t
=
threading
.
Thread
(
target
=
_wait_and_warmup
,
args
=
(
server_args
,
pipe_finish_writer
)
)
t
.
start
()
t
.
start
()
# Listen for requests
# Listen for requests
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment