Skip to content

Commit 5f054b2

Browse files
committed
router recv reqs update
1 parent 81c5f61 commit 5f054b2

File tree

1 file changed

+14
-6
lines changed

1 file changed

+14
-6
lines changed

lightllm/server/router/manager.py

Lines changed: 14 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,7 @@ def __init__(self, args: StartArgs, router_port, detokenization_port, metric_por
7979
self.eos_id = args.eos_id
8080
self.has_wait_tokens = 0
8181
self.max_wait_tokens = args.router_max_wait_tokens
82-
context = zmq.asyncio.Context(2)
82+
context = zmq.Context(2)
8383
self.recv_from_httpserver = context.socket(zmq.PULL)
8484
self.recv_from_httpserver.bind(f"{args.zmq_mode}127.0.0.1:{router_port}")
8585

@@ -442,13 +442,21 @@ def get_used_tokens(self, dp_index):
442442
else:
443443
return self.max_total_token_num - self.read_only_statics_mem_manager.get_unrefed_token_num(dp_index)
444444

445+
def recv_reqs(self):
    """Drain every request currently queued on the HTTP-server socket.

    Repeatedly performs a non-blocking receive on
    ``self.recv_from_httpserver`` and passes each received
    ``GroupReqIndexes`` to ``self.add_req``. Returns as soon as the socket
    reports that no message is ready.

    Raises:
        AssertionError: if a received object is not a ``GroupReqIndexes``.
        zmq.ZMQError: for any socket failure other than "no message ready"
            (those used to be swallowed and mistaken for an empty queue).
    """
    while True:
        # Keep the try body to the single call that can signal "empty" so
        # errors raised by add_req are never mistaken for socket state.
        try:
            # NOTE(review): recv_pyobj unpickles the payload; this is only
            # safe while the peer is a trusted local process — confirm.
            recv_req: GroupReqIndexes = self.recv_from_httpserver.recv_pyobj(zmq.NOBLOCK)
        except zmq.Again:
            # EAGAIN from a NOBLOCK receive: nothing left to read right now.
            return

        if not isinstance(recv_req, GroupReqIndexes):
            # Explicit raise instead of `assert False` so the check survives
            # `python -O`; exception type and message are unchanged.
            raise AssertionError(f"Error Req Inf {recv_req}")

        self.add_req(recv_req)
455+
445456
async def loop_for_netio_req(self):
446457
while True:
447-
recv_req: GroupReqIndexes = await self.recv_from_httpserver.recv_pyobj()
448-
if isinstance(recv_req, GroupReqIndexes):
449-
self.add_req(recv_req)
450-
else:
451-
assert False, f"Error Req Inf {recv_req}"
458+
self.recv_reqs()
459+
await asyncio.sleep(0.01)
452460

453461
def clean_up(self):
454462
return

0 commit comments

Comments
 (0)