Skip to content

Commit a01bd90

Browse files
committed
fix
1 parent 89e4068 commit a01bd90

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/decode_node_impl/decode_trans_process.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -59,7 +59,7 @@ def _handle_prefill_join(
5959
src_id=node_info.prefill_id, dest_id=node_info.decode_id, is_server=False, store=store_client
6060
)
6161
comm = PyNcclCommunicator(group, node_info.decode_device_id)
62-
connect_id_to_comm[node_info.prefill_id] = comm
62+
connect_id_to_comm[node_info.connect_id] = comm
6363
logger.info(f"{node_info} kv trans connected")
6464
task_out_queue.put("nccl_ok")
6565
except Exception as e:
@@ -84,13 +84,13 @@ def _init_env(args, device_id: int, task_in_queue: mp.Queue, task_out_queue: mp.
8484
task: Union[KVMoveTaskGroup, PDTransJoinInfo, PDTransLeaveInfo] = task_in_queue.get()
8585
if isinstance(task, KVMoveTaskGroup):
8686
_handle_kvmove_task(
87-
task, task_out_queue, mem_managers, connect_id_to_comm, task.connect_id, dp_size_in_node
87+
task.tasks, task_out_queue, mem_managers, connect_id_to_comm, task.connect_id, dp_size_in_node
8888
)
8989
elif isinstance(task, PDTransJoinInfo):
9090
_handle_prefill_join(task, task_out_queue, connect_id_to_comm)
9191
elif isinstance(task, PDTransLeaveInfo):
9292
if task.connect_id in connect_id_to_comm:
93-
connect_id_to_comm[task.prefill_id].destroy()
93+
connect_id_to_comm[task.connect_id].destroy()
9494
logger.info(f"destory {task} nccl communicator.")
9595
else:
9696
logger.info(f"no connect_id {task.connect_id} found in connect_id_to_comm")

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl/prefill_kv_move_manager.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -189,7 +189,7 @@ def remove_trans_obj(self, connect_id):
189189
trans_obj = self.connect_id_to_trans_obj.pop(connect_id, None)
190190
if trans_obj is not None:
191191
trans_obj.set_has_error()
192-
logger.error(f"remove tran obj id {trans_obj.decode_node_id}")
192+
logger.error(f"remove tran obj decode_node_id {trans_obj.decode_node_id}")
193193
return
194194

195195
def __get_trans_obj(self, task: KVMoveTask):

0 commit comments

Comments
 (0)