Skip to content

Commit 355c2f1

Browse files
committed
Send the notification to the remote agent name (not the engine ID)
Signed-off-by: nicklucche <[email protected]>
1 parent ef200c0 commit 355c2f1

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -845,7 +845,9 @@ def _read_blocks(
845845
# just notify P worker that we have the blocks we need.
846846
num_local_blocks = len(local_block_ids)
847847
if num_local_blocks == 0:
848-
self.nixl_wrapper.send_notif(dst_engine_id, notif_msg=notif_id)
848+
remote_rank = self.rank // tp_ratio
849+
remote_agent = self._remote_agents[dst_engine_id][remote_rank]
850+
self.nixl_wrapper.send_notif(remote_agent, notif_msg=notif_id)
849851
return
850852

851853
# Partial prefix cache hit: just read uncomputed blocks.
@@ -912,7 +914,7 @@ def _read_blocks(
912914
self.nixl_wrapper.transfer(handle)
913915

914916
# Use handle to check completion in future step().
915-
# TODO surface xfer elapsed time
917+
# TODO (NickLucche) surface xfer elapsed time
916918
self._recving_transfers[request_id].append(
917919
(handle, time.perf_counter()))
918920

0 commit comments

Comments
 (0)