@@ -203,7 +203,7 @@ def get_worker(
203203 controller_addr : str = "http://localhost:21001" ,
204204 worker_id : str = str (uuid .uuid4 ())[:8 ],
205205 model_names : List [str ] = ["" ],
206- limit_worker_concurrency : int = 512 ,
206+ limit_worker_concurrency : int = 1024 ,
207207 conv_template : str = None , # type: ignore
208208 ):
209209 worker = cls (
@@ -251,6 +251,8 @@ def run(cls):
251251 parser .add_argument ("--log_level" , type = str , default = "WARNING" )
252252 # task_type
253253 parser .add_argument ("--task_type" , type = str , default = "auto" )
254+ # limit_worker_concurrency
255+ parser .add_argument ("--limit_worker_concurrency" , type = int , default = 1024 )
254256 args = parser .parse_args ()
255257 os .environ ["num_gpus" ] = str (args .num_gpus )
256258 if args .backend == "vllm" :
@@ -279,6 +281,7 @@ def run(cls):
279281 os .environ ["dtype" ] = args .dtype
280282 os .environ ["log_level" ] = args .log_level
281283 os .environ ["task_type" ] = args .task_type
284+ limit_worker_concurrency = int (args .limit_worker_concurrency )
282285 logger .remove (0 )
283286 log_level = os .getenv ("log_level" , "WARNING" )
284287 logger .add (sys .stderr , level = log_level )
@@ -291,6 +294,8 @@ def run(cls):
291294 os .environ ["WORKER_PORT" ] = str (port )
292295 os .environ ["WORKER_HOST" ] = str (local_ip )
293296 worker_addr = f"http://{ host } :{ port } "
297+ model_names = args .model_names
298+ logger .info (f"{ model_names [0 ]} args: \n { args } " )
294299
295300 @app .on_event ("startup" )
296301 async def startup ():
@@ -299,9 +304,10 @@ async def startup():
299304 worker = cls .get_worker (
300305 worker_addr = worker_addr ,
301306 model_path = args .model_name_or_path ,
302- model_names = args . model_names ,
307+ model_names = model_names ,
303308 conv_template = "chatglm3" , # TODO: defaults to chatglm3 for unified handling
304309 controller_addr = controller_address ,
310+ limit_worker_concurrency = limit_worker_concurrency ,
305311 )
306312
307313 uvicorn .run (app , host = host , port = port )
0 commit comments