Unverified commit 5dfcd6c2, authored by Liangsheng Yin, committed by GitHub
Browse files

add proctitle for tokenizers (#9952)


Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
parent 0dfd54d1
...@@ -29,6 +29,8 @@ import time ...@@ -29,6 +29,8 @@ import time
from http import HTTPStatus from http import HTTPStatus
from typing import Any, AsyncIterator, Callable, Dict, List, Optional from typing import Any, AsyncIterator, Callable, Dict, List, Optional
import setproctitle
# Fix a bug of Python threading # Fix a bug of Python threading
setattr(threading, "_register_atexit", lambda *args, **kwargs: None) setattr(threading, "_register_atexit", lambda *args, **kwargs: None)
...@@ -1166,6 +1168,7 @@ def launch_server( ...@@ -1166,6 +1168,7 @@ def launch_server(
2. Inter-process communication is done through IPC (each process uses a different port) via the ZMQ library. 2. Inter-process communication is done through IPC (each process uses a different port) via the ZMQ library.
""" """
if server_args.tokenizer_worker_num > 1: if server_args.tokenizer_worker_num > 1:
setproctitle.setproctitle(f"sglang::http_server/multi_tokenizer_router")
port_args = PortArgs.init_new(server_args) port_args = PortArgs.init_new(server_args)
port_args.tokenizer_worker_ipc_name = ( port_args.tokenizer_worker_ipc_name = (
f"ipc://{tempfile.NamedTemporaryFile(delete=False).name}" f"ipc://{tempfile.NamedTemporaryFile(delete=False).name}"
...@@ -1174,6 +1177,7 @@ def launch_server( ...@@ -1174,6 +1177,7 @@ def launch_server(
server_args=server_args, port_args=port_args server_args=server_args, port_args=port_args
) )
else: else:
setproctitle.setproctitle(f"sglang::http_server/tokenizer_manager")
tokenizer_manager, template_manager, scheduler_info = _launch_subprocesses( tokenizer_manager, template_manager, scheduler_info = _launch_subprocesses(
server_args=server_args, server_args=server_args,
) )
......
...@@ -23,6 +23,7 @@ import threading ...@@ -23,6 +23,7 @@ import threading
from multiprocessing import shared_memory from multiprocessing import shared_memory
from typing import Dict from typing import Dict
import setproctitle
import zmq import zmq
import zmq.asyncio import zmq.asyncio
...@@ -476,6 +477,9 @@ class MultiTokenizerManager(TokenizerManager, MultiTokenizerMixin): ...@@ -476,6 +477,9 @@ class MultiTokenizerManager(TokenizerManager, MultiTokenizerMixin):
server_args: ServerArgs, server_args: ServerArgs,
port_args: PortArgs, port_args: PortArgs,
): ):
setproctitle.setproctitle(
f"sglang::http_server/multi_tokenizer_manager:{os.getpid()}"
)
# prevent init prefill bootstrapserver again # prevent init prefill bootstrapserver again
disaggregation_mode = server_args.disaggregation_mode disaggregation_mode = server_args.disaggregation_mode
server_args.disaggregation_mode = "null" server_args.disaggregation_mode = "null"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment