2 files changed: +8 -6 lines changed
lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl (2 files changed: +8 -6 lines changed)
Original file line number | Diff line number | Diff line change
@@ -49,17 +49,17 @@ def init_custom(self):
4949 return
5050
5151 def _pre_handle_finished_reqs (self , finished_reqs ):
52- self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (run_reqs = finished_reqs )
52+ self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (finished_reqs = finished_reqs )
5353 return
5454
55- def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , run_reqs : List [InferReq ]):
55+ def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , finished_reqs : List [InferReq ]):
5656 # 提前在radix cache中回收相关的信息,并添加引用进行锁定,方便传输进程传输kv。
5757 if self .is_master_in_dp :
5858 logger .info ("prefill_req_handle_and_frozen_tokens" )
5959
6060 g_infer_state_lock .acquire ()
6161 try :
62- for req in run_reqs :
62+ for req in finished_reqs :
6363
6464 # 区分abort 和 正常结束的请求,正常结束的请求才发起kv传输任务。
6565 if not req .finish_status .is_finished ():
Original file line number | Diff line number | Diff line change
@@ -19,9 +19,11 @@ def init_custom(self):
1919 return
2020
2121 def _pre_handle_finished_reqs (self , finished_reqs ):
22- self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (run_reqs = finished_reqs )
22+ self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (finished_reqs = finished_reqs )
2323 return
2424
25- def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , run_reqs : List [InferReq ]):
26- DPChunkedForPrefillNode ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , run_reqs = run_reqs )
25+ def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , finished_reqs : List [InferReq ]):
26+ ChunckedPrefillForPrefillNode ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (
27+ self , finished_reqs = finished_reqs
28+ )
2729 return
You can’t perform that action at this time.
0 commit comments