Skip to content

Commit e4e222f

Browse files
committed
fix pause reqs
1 parent 971936e commit e4e222f

File tree

2 files changed

+4
-3
lines changed

2 files changed

+4
-3
lines changed

lightllm/server/router/manager.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -307,7 +307,7 @@ async def _step(self):
307307
paused_reqs = select_paused_reqs(
308308
self.running_batch, self.pause_strategy, self.req_queue, self.max_total_token_num
309309
)
310-
await self._pause_reqs(self.running_batch, paused_reqs)
310+
await self._pause_reqs(paused_reqs)
311311
logger.debug(f"pasued req num: {self.req_queue.get_paused_req_num()}")
312312
self.has_wait_tokens = 0
313313
return
@@ -342,9 +342,9 @@ async def _decode_batch(self, batch: Batch):
342342
)
343343
return
344344

345-
async def _pause_reqs(self, batch: Batch, pasue_reqs):
345+
async def _pause_reqs(self, pasue_reqs):
346346
pasue_req_ids = [r.request_id for r in pasue_reqs]
347-
await self.model_rpc_client.pause_reqs(batch.batch_id, pasue_req_ids)
347+
await self.model_rpc_client.pause_reqs(pasue_req_ids)
348348
return
349349

350350
def _filter_runing_batch(self):

lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -54,6 +54,7 @@ def post_handel(self, run_reqs: List[InferReq], next_token_ids, next_token_logpr
5454

5555
req_obj.cur_kv_len = len(req_obj.get_chuncked_input_token_ids())
5656
if req_obj.cur_kv_len < req_obj.get_cur_total_len():
57+
req_obj.shm_req.shm_cur_kv_len = req_obj.cur_kv_len
5758
continue
5859

5960
req_obj.set_next_gen_token_id(next_token_id, next_token_logprob)

0 commit comments

Comments
 (0)