Skip to content

Commit 7453390

Browse files
committed
fix
1 parent e41f365 commit 7453390

File tree

2 files changed

+10
-10
lines changed

2 files changed

+10
-10
lines changed

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/decode_node_impl/decode_trans_process.py

Lines changed: 6 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -55,15 +55,16 @@ def _handle_prefill_join(
55 55
try:
56 56
logger.info(f"connect start {node_info}")
57 57
store_client = TCPStore(
58 -
host_name=node_info.pd_prefill_nccl_ip, port=node_info.pd_prefill_nccl_port, is_master=False, use_libuv=True, timeout=timedelta(seconds=30)
58 +
host_name=node_info.pd_prefill_nccl_ip,
59 +
port=node_info.pd_prefill_nccl_port,
60 +
is_master=False,
61 +
use_libuv=True,
62 +
timeout=timedelta(seconds=30),
59 63
)
60 64
src_id = node_info.prefill_id
61 65
dest_id = node_info.connect_id
62 66
logger.info(f"connect src_id {src_id} dest_id {dest_id}")
63 -
group = StatelessP2PProcessGroup.create(src_id=src_id,
64 -
dest_id=dest_id,
65 -
is_server=False,
66 -
store=store_client)
67 +
group = StatelessP2PProcessGroup.create(src_id=src_id, dest_id=dest_id, is_server=False, store=store_client)
67 68
comm = PyNcclCommunicator(group, node_info.decode_device_id)
68 69
connect_id_to_comm[node_info.connect_id] = comm
69 70
logger.info(f"{node_info} kv trans connected")

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl/prefill_trans_process.py

Lines changed: 4 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -61,10 +61,7 @@ def _handle_decode_join(
61 61
src_id = node_info.prefill_id
62 62
dest_id = node_info.connect_id
63 63
logger.info(f"connect src_id {src_id} dest_id {dest_id}")
64 -
group = StatelessP2PProcessGroup.create(src_id=src_id,
65 -
dest_id=dest_id,
66 -
is_server=True,
67 -
store=store)
64 +
group = StatelessP2PProcessGroup.create(src_id=src_id, dest_id=dest_id, is_server=True, store=store)
68 65
comm = PyNcclCommunicator(group, node_info.prefill_device_id)
69 66
connect_id_to_comm[node_info.connect_id] = comm
70 67
logger.info(f"{node_info} kv trans connected!")
@@ -94,7 +91,9 @@ def _init_env(
94 91
try:
95 92
torch.cuda.set_device(device_id)
96 93
graceful_registry(inspect.currentframe().f_code.co_name)
97 -
master_store = TCPStore(host_name=store_ip, port=store_port, is_master=True, use_libuv=True, timeout=timedelta(seconds=30))
94 +
master_store = TCPStore(
95 +
host_name=store_ip, port=store_port, is_master=True, use_libuv=True, timeout=timedelta(seconds=30)
96 +
)
98 97
dp_size_in_node = max(1, args.dp // args.nnodes)
99 98
task_out_queue.put("proc_start")
100 99
mem_managers: List[MemoryManager] = [mem_queue.get(timeout=60) for mem_queue in mem_queues]

0 commit comments

Comments
 (0)