Skip to content

Commit 3bac7a2

Browse files
author
wangzaijun
committed
fix health check for pd mode
1 parent a5dcdea commit 3bac7a2

File tree

2 files changed

+9
-2
lines changed

2 files changed

+9
-2
lines changed

lightllm/server/api_server.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -113,7 +113,7 @@ async def healthcheck(request: Request):
113 113

114 114
from lightllm.utils.health_check import health_check
115 115

116-
if await health_check(g_objs.httpserver_manager, request):
116+
if await health_check(g_objs.args, g_objs.httpserver_manager, request):
117 117
return JSONResponse({"message": "Ok"}, status_code=200)
118 118
else:
119 119
return JSONResponse({"message": "Error"}, status_code=404)

lightllm/utils/health_check.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,18 +4,25 @@
4 4
from lightllm.server.multimodal_params import MultimodalParams
5 5
from lightllm.server.httpserver.manager import HttpServerManager
6 6
from fastapi import Request
7+
from lightllm.server.req_id_generator import ReqIDGenerator
7 8
from lightllm.utils.log_utils import init_logger
8 9

9 10
logger = init_logger(__name__)
10 11

11 12

12-
async def health_check(httpserver_manager: HttpServerManager, request: Request):
13+
_g_health_req_id_gen = ReqIDGenerator()
14+
_g_health_req_id_gen.generate_id()
15+
16+
17+
async def health_check(args, httpserver_manager: HttpServerManager, request: Request):
13 18
try:
14 19
request_dict = {"inputs": "你好!", "parameters": {"do_sample": True, "temperature": 0.8, "max_new_tokens": 2}}
15 20
prompt = request_dict.pop("inputs")
16 21
sample_params_dict = request_dict["parameters"]
17 22
sampling_params = SamplingParams(**sample_params_dict)
18 23
sampling_params.verify()
24+
if args.run_mode in ["prefill", "decode"]:
25+
sampling_params.group_request_id = -_g_health_req_id_gen.generate_id() # health monitor 的 id 是负的
19 26
multimodal_params_dict = request_dict.get("multimodal_params", {})
20 27
multimodal_params = MultimodalParams(**multimodal_params_dict)
21 28

0 commit comments

Comments
 (0)