4141from .multimodal_params import MultimodalParams
4242from .httpserver .manager import HttpServerManager
4343from .httpserver_for_pd_master .manager import HttpServerManagerForPDMaster
44- from .api_lightllm import lightllm_get_score , lightllm_pd_generate_stream
44+ from .api_lightllm import lightllm_get_score
4545from lightllm .utils .envs_utils import get_env_start_args , get_lightllm_websocket_max_message_size
4646from lightllm .utils .log_utils import init_logger
47+ from lightllm .utils .error_utils import ServerBusyError
4748from lightllm .server .metrics .manager import MetricClient
4849from lightllm .utils .envs_utils import get_unique_server_name
4950from dataclasses import dataclass
@@ -136,6 +137,9 @@ def get_model_name():
136137@app .get ("/health" , summary = "Check server health" )
137138@app .head ("/health" , summary = "Check server health" )
138139async def healthcheck (request : Request ):
140+ if g_objs .args .run_mode == "pd_master" :
141+ return JSONResponse ({"message" : "Ok" }, status_code = 200 )
142+
139143 if os .environ .get ("DEBUG_HEALTHCHECK_RETURN_FAIL" ) == "true" :
140144 return JSONResponse ({"message" : "Error" }, status_code = 503 )
141145 from lightllm .utils .health_check import health_check , health_obj
@@ -175,6 +179,9 @@ async def token_load(request: Request):
async def generate(request: Request) -> Response:
    """Run a generate request through the configured handler.

    Awaits ``g_objs.g_generate_func`` with the incoming request and the shared
    ``g_objs.httpserver_manager`` and returns whatever it produces. Failures
    are logged with a traceback and converted to error responses rather than
    propagated:

    * ``ServerBusyError`` -> ``HTTPStatus.SERVICE_UNAVAILABLE`` (503)
    * any other ``Exception`` -> ``HTTPStatus.EXPECTATION_FAILED`` (417)
    """
    try:
        pending = g_objs.g_generate_func(request, g_objs.httpserver_manager)
        return await pending
    except ServerBusyError as busy:
        # Must be listed before the generic handler so it gets its own status.
        detail = str(busy)
        logger.error("%s", detail, exc_info=True)
        return create_error_response(HTTPStatus.SERVICE_UNAVAILABLE, detail)
    except Exception as failure:
        detail = str(failure)
        logger.error("An error occurred: %s", detail, exc_info=True)
        return create_error_response(HTTPStatus.EXPECTATION_FAILED, detail)
@@ -184,15 +191,9 @@ async def generate(request: Request) -> Response:
async def generate_stream(request: Request) -> Response:
    """Run a streaming generate request through the configured handler.

    Awaits ``g_objs.g_generate_stream_func`` with the incoming request and the
    shared ``g_objs.httpserver_manager`` and returns whatever it produces.
    Failures are logged with a traceback and converted to error responses
    rather than propagated:

    * ``ServerBusyError`` -> ``HTTPStatus.SERVICE_UNAVAILABLE`` (503)
    * any other ``Exception`` -> ``HTTPStatus.EXPECTATION_FAILED`` (417)
    """
    try:
        pending = g_objs.g_generate_stream_func(request, g_objs.httpserver_manager)
        return await pending
    except ServerBusyError as busy:
        # Must be listed before the generic handler so it gets its own status.
        detail = str(busy)
        logger.error("%s", detail, exc_info=True)
        return create_error_response(HTTPStatus.SERVICE_UNAVAILABLE, detail)
    except Exception as failure:
        detail = str(failure)
        logger.error("An error occurred: %s", detail, exc_info=True)
        return create_error_response(HTTPStatus.EXPECTATION_FAILED, detail)
0 commit comments