Skip to content

Commit f9a3fe2

Browse files
authored
Add setproctitle (#1024)
1 parent 914dd58 commit f9a3fe2

File tree

18 files changed

+55
-4
lines changed

18 files changed

+55
-4
lines changed

lightllm/server/api_http.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,7 @@
2525
import os
2626
from io import BytesIO
2727
import pickle
28+
import setproctitle
2829

2930
asyncio.set_event_loop_policy(uvloop.EventLoopPolicy())
3031
import ujson as json
@@ -83,6 +84,8 @@ def set_args(self, args):
8384
self.g_generate_func = lightllm_generate
8485
self.g_generate_stream_func = lightllm_generate_stream
8586

87+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::api_server")
88+
8689
if args.run_mode == "pd_master":
8790
self.metric_client = MetricClient(args.metric_port)
8891
self.httpserver_manager = HttpServerManagerForPDMaster(

lightllm/server/api_start.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ def normal_or_p_d_start(args):
9494

9595
if args.graph_max_len_in_batch == 0:
9696
args.graph_max_len_in_batch = args.max_req_total_len
97-
97+
9898
# mode setting check.
9999
if args.output_constraint_mode != "none":
100100
assert args.disable_dynamic_prompt_cache is False

lightllm/server/audioserver/manager.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -5,6 +5,7 @@
55
import uvloop
66
import rpyc
77
import inspect
8+
import setproctitle
89
from typing import List
910

1011
asyncio.set_event_loop_policy(uvloop.EventLoopPolicy())
@@ -14,6 +15,7 @@
1415
from lightllm.server.multimodal_params import AudioItem
1516
from .model_infer.model_rpc import start_model_process, AudioModelRpcClient
1617
from lightllm.utils.graceful_utils import graceful_registry
18+
from lightllm.utils.envs_utils import get_unique_server_name
1719
from rpyc.utils.classic import obtain
1820

1921
logger = init_logger(__name__)
@@ -140,6 +142,7 @@ def clean_up(self):
140142
def start_audio_process(args, router_port, audio_port, cache_port, pipe_writer):
141143
# 注册graceful 退出的处理
142144
graceful_registry(inspect.currentframe().f_code.co_name)
145+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::audio_server")
143146

144147
try:
145148
audioserver = AudioManager(args, router_port, audio_port, cache_port)

lightllm/server/config_server/api_http.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,6 +2,7 @@
22
import asyncio
33
import base64
44
import pickle
5+
import setproctitle
56
import multiprocessing as mp
67
from fastapi import FastAPI, WebSocket, WebSocketDisconnect, Request, Query
78
from threading import Lock
@@ -10,7 +11,7 @@
1011
from lightllm.utils.log_utils import init_logger
1112
from ..pd_io_struct import PD_Master_Obj
1213
from .nccl_tcp_store import start_tcp_store_server
13-
from lightllm.utils.envs_utils import get_env_start_args
14+
from lightllm.utils.envs_utils import get_env_start_args, get_unique_server_name
1415
from lightllm.utils.process_check import start_parent_check_thread
1516

1617

@@ -202,5 +203,6 @@ async def http_start_tcp_store_server(
202203
return {"status": "ok"}
203204

204205

206+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::config_server")
205207
logger.info("config server start_parent_check_thread...")
206208
start_parent_check_thread()

lightllm/server/config_server/nccl_tcp_store.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,9 +1,11 @@
11
import psutil
22
import time
3+
import setproctitle
34
import torch.distributed as dist
45
import torch.multiprocessing as mp
56
from lightllm.utils.log_utils import init_logger
67
from lightllm.utils.process_check import start_parent_check_thread
8+
from lightllm.utils.envs_utils import get_unique_server_name
79

810
logger = init_logger(__name__)
911

@@ -26,6 +28,7 @@ def _start_tcp_store_server(nccl_store_host, nccl_store_port):
2628
start a TCPStore server.
2729
"""
2830
start_parent_check_thread()
31+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::nccl_tcp_store")
2932

3033
try:
3134
from torch._C._distributed_c10d import _DEFAULT_PG_NCCL_TIMEOUT

lightllm/server/detokenization/manager.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,6 @@
11
import uvloop
22
import asyncio
3+
import setproctitle
34

45
asyncio.set_event_loop_policy(uvloop.EventLoopPolicy())
56
import zmq
@@ -15,6 +16,7 @@
1516
import pickle
1617
import time
1718
from lightllm.utils.log_utils import init_logger
19+
from lightllm.utils.envs_utils import get_unique_server_name
1820

1921
logger = init_logger(__name__)
2022

@@ -173,6 +175,7 @@ def remove_finished_reqs(self):
173175
def start_detokenization_process(args, detokenization_port, detokenization_pub_port, pipe_writer):
174176
# 注册graceful 退出的处理
175177
graceful_registry(inspect.currentframe().f_code.co_name)
178+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::detokenization_server")
176179

177180
try:
178181
manager = DeTokenizationManager(

lightllm/server/embed_cache/manager.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,10 +1,12 @@
11
import rpyc
22
import uuid
33
import inspect
4+
import setproctitle
45
from typing import Union, Optional
56
from lightllm.utils.graceful_utils import graceful_registry
67
from lightllm.server.embed_cache.impl.naive_memory_cache import InMemoryCache
78
from rpyc.utils.classic import obtain
9+
from lightllm.utils.envs_utils import get_unique_server_name
810

911

1012
class CacheServer(rpyc.Service):
@@ -53,6 +55,7 @@ def start_cache_manager(port: int, args, pipe_writer):
5355
# 注册graceful 退出的处理
5456
graceful_registry(inspect.currentframe().f_code.co_name)
5557

58+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::cache_manager")
5659
manager = InMemoryCache(args)
5760
service = CacheServer(manager)
5861
from rpyc.utils.server import ThreadedServer

lightllm/server/health_monitor/manager.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,7 @@
11
import sys
22
import uvloop
33
import asyncio
4+
import setproctitle
45

56
asyncio.set_event_loop_policy(uvloop.EventLoopPolicy())
67
import os
@@ -10,6 +11,7 @@
1011

1112
from lightllm.utils.log_utils import init_logger
1213
from lightllm.utils.graceful_utils import graceful_registry
14+
from lightllm.utils.envs_utils import get_unique_server_name
1315

1416
logger = init_logger(__name__)
1517

@@ -88,6 +90,7 @@ def get_all_cared_pids():
8890
def start_health_check_process(args, pipe_writer):
8991
# 注册graceful 退出的处理
9092
graceful_registry(inspect.currentframe().f_code.co_name)
93+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::health_monitor")
9194
pipe_writer.send("init ok")
9295

9396
all_process_ids = get_all_cared_pids()

lightllm/server/metrics/manager.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -5,11 +5,13 @@
55
import inspect
66
import functools
77
import queue
8+
import setproctitle
89
from .metrics import Monitor
910
from prometheus_client import generate_latest
1011
from rpyc import SocketStream
1112
from lightllm.utils.log_utils import init_logger
1213
from lightllm.utils.graceful_utils import graceful_registry
14+
from lightllm.utils.envs_utils import get_unique_server_name
1315

1416
logger = init_logger(__name__)
1517

@@ -136,6 +138,7 @@ def run(self):
136138
def start_metric_manager(port: int, args, pipe_writer):
137139
# 注册graceful 退出的处理
138140
graceful_registry(inspect.currentframe().f_code.co_name)
141+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::metric_manager")
139142

140143
service = MetricServer(args)
141144
if args.metric_gateway is not None:

lightllm/server/router/manager.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,6 +4,7 @@
44
import torch
55
import pickle
66
import inspect
7+
import setproctitle
78

89
asyncio.set_event_loop_policy(uvloop.EventLoopPolicy())
910
import zmq
@@ -507,6 +508,7 @@ def clean_up(self):
507508
def start_router_process(args, router_port, detokenization_port, metric_port, pipe_writer):
508509
# 注册 graceful 退出的处理
509510
graceful_registry(inspect.currentframe().f_code.co_name)
511+
setproctitle.setproctitle(f"lightllm::{get_unique_server_name()}::router_server")
510512
start_parent_check_thread()
511513

512514
def handle_exception(loop, context):

0 commit comments

Comments
 (0)