Skip to content

Commit 5b53069

Browse files
author
wangzaijun
committed
fix
1 parent 62ccdab commit 5b53069

File tree

2 files changed

+11
-7
lines changed

2 files changed

+11
-7
lines changed

lightllm/server/router/model_infer/mode_backend/pd_nixl/decode_node_impl/decode_impl_for_dp.py

Lines changed: 9 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
33
from lightllm.utils.log_utils import init_logger
44
from typing import List, Tuple
55
from lightllm.server.router.model_infer.mode_backend.dp_backend.impl import DPChunkedPrefillBackend
6-
from .decode_impl import NIXLDecodeNode
6+
from .decode_impl import NIXLDecodeNode, NIXLChunckedTransTaskGroup
77

88
logger = init_logger(__name__)
99

@@ -32,13 +32,18 @@ def _decode_node_gen_trans_tasks(self, req_obj: InferReq):
3232
return NIXLDecodeNode._decode_node_gen_trans_tasks(self, req_obj=req_obj)
3333

3434
def _create_nixl_trans_task(
35-
self, req_obj: InferReq, mem_indexes: List[int], kv_start_index: int, kv_end_index: int, is_first_task: bool
35+
self,
36+
req_obj: InferReq,
37+
mem_indexes: List[int],
38+
kv_start_index: int,
39+
kv_end_index: int,
40+
group: NIXLChunckedTransTaskGroup,
3641
):
37-
return NIXLDecodeNode._decode_node_gen_trans_tasks(
42+
return NIXLDecodeNode._create_nixl_trans_task(
3843
self,
3944
req_obj=req_obj,
4045
mem_indexes=mem_indexes,
4146
kv_start_index=kv_start_index,
4247
kv_end_index=kv_end_index,
43-
is_first_task=is_first_task,
48+
group=group,
4449
)

lightllm/server/router/model_infer/mode_backend/pd_nixl/prefill_node_impl/prefill_impl_for_dp.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -27,12 +27,11 @@ def _filter_not_ready_reqs(self, req_ids: List[int]) -> List[InferReq]:
2727
def _prefill_chuncked_handle_func(
2828
self, req_obj: InferReq, next_token_id: int, next_token_prob: float, output_len: int
2929
):
30-
NIXLChunckedPrefillForPrefillNode._prefill_chuncked_handle_func(
30+
return NIXLChunckedPrefillForPrefillNode._prefill_chuncked_handle_func(
3131
self, req_obj=req_obj, next_token_id=next_token_id, next_token_prob=next_token_prob, output_len=output_len
3232
)
33-
return
3433

3534
def _create_nixl_trans_task(self, req_obj: InferReq, kv_start_index: int, kv_end_index: int):
36-
NIXLChunckedPrefillForPrefillNode._create_nixl_trans_task(
35+
return NIXLChunckedPrefillForPrefillNode._create_nixl_trans_task(
3736
self, req_obj=req_obj, kv_start_index=kv_start_index, kv_end_index=kv_end_index
3837
)

0 commit comments

Comments
 (0)