add proctitle for tokenizers (#9952)
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
This commit is contained in:
@@ -29,6 +29,8 @@ import time
|
|||||||
from http import HTTPStatus
|
from http import HTTPStatus
|
||||||
from typing import Any, AsyncIterator, Callable, Dict, List, Optional
|
from typing import Any, AsyncIterator, Callable, Dict, List, Optional
|
||||||
|
|
||||||
|
import setproctitle
|
||||||
|
|
||||||
# Fix a bug of Python threading
|
# Fix a bug of Python threading
|
||||||
setattr(threading, "_register_atexit", lambda *args, **kwargs: None)
|
setattr(threading, "_register_atexit", lambda *args, **kwargs: None)
|
||||||
|
|
||||||
@@ -1166,6 +1168,7 @@ def launch_server(
|
|||||||
2. Inter-process communication is done through IPC (each process uses a different port) via the ZMQ library.
|
2. Inter-process communication is done through IPC (each process uses a different port) via the ZMQ library.
|
||||||
"""
|
"""
|
||||||
if server_args.tokenizer_worker_num > 1:
|
if server_args.tokenizer_worker_num > 1:
|
||||||
|
setproctitle.setproctitle(f"sglang::http_server/multi_tokenizer_router")
|
||||||
port_args = PortArgs.init_new(server_args)
|
port_args = PortArgs.init_new(server_args)
|
||||||
port_args.tokenizer_worker_ipc_name = (
|
port_args.tokenizer_worker_ipc_name = (
|
||||||
f"ipc://{tempfile.NamedTemporaryFile(delete=False).name}"
|
f"ipc://{tempfile.NamedTemporaryFile(delete=False).name}"
|
||||||
@@ -1174,6 +1177,7 @@ def launch_server(
|
|||||||
server_args=server_args, port_args=port_args
|
server_args=server_args, port_args=port_args
|
||||||
)
|
)
|
||||||
else:
|
else:
|
||||||
|
setproctitle.setproctitle(f"sglang::http_server/tokenizer_manager")
|
||||||
tokenizer_manager, template_manager, scheduler_info = _launch_subprocesses(
|
tokenizer_manager, template_manager, scheduler_info = _launch_subprocesses(
|
||||||
server_args=server_args,
|
server_args=server_args,
|
||||||
)
|
)
|
||||||
|
|||||||
@@ -23,6 +23,7 @@ import threading
|
|||||||
from multiprocessing import shared_memory
|
from multiprocessing import shared_memory
|
||||||
from typing import Dict
|
from typing import Dict
|
||||||
|
|
||||||
|
import setproctitle
|
||||||
import zmq
|
import zmq
|
||||||
import zmq.asyncio
|
import zmq.asyncio
|
||||||
|
|
||||||
@@ -476,6 +477,9 @@ class MultiTokenizerManager(TokenizerManager, MultiTokenizerMixin):
|
|||||||
server_args: ServerArgs,
|
server_args: ServerArgs,
|
||||||
port_args: PortArgs,
|
port_args: PortArgs,
|
||||||
):
|
):
|
||||||
|
setproctitle.setproctitle(
|
||||||
|
f"sglang::http_server/multi_tokenizer_manager:{os.getpid()}"
|
||||||
|
)
|
||||||
# prevent init prefill bootstrapserver again
|
# prevent init prefill bootstrapserver again
|
||||||
disaggregation_mode = server_args.disaggregation_mode
|
disaggregation_mode = server_args.disaggregation_mode
|
||||||
server_args.disaggregation_mode = "null"
|
server_args.disaggregation_mode = "null"
|
||||||
|
|||||||
Reference in New Issue
Block a user