File tree Expand file tree Collapse file tree 1 file changed +4
-2
lines changed
vllm/distributed/kv_transfer/kv_connector/v1 Expand file tree Collapse file tree 1 file changed +4
-2
lines changed Original file line number Diff line number Diff line change @@ -845,7 +845,9 @@ def _read_blocks(
845845 # just notify P worker that we have the blocks we need.
846846 num_local_blocks = len (local_block_ids )
847847 if num_local_blocks == 0 :
848- self .nixl_wrapper .send_notif (dst_engine_id , notif_msg = notif_id )
848+ remote_rank = self .rank // tp_ratio
849+ remote_agent = self ._remote_agents [dst_engine_id ][remote_rank ]
850+ self .nixl_wrapper .send_notif (remote_agent , notif_msg = notif_id )
849851 return
850852
851853 # Partial prefix cache hit: just read uncomputed blocks.
@@ -912,7 +914,7 @@ def _read_blocks(
912914 self .nixl_wrapper .transfer (handle )
913915
914916 # Use handle to check completion in future step().
915- # TODO surface xfer elapsed time
917+ # TODO (NickLucche) surface xfer elapsed time
916918 self ._recving_transfers [request_id ].append (
917919 (handle , time .perf_counter ()))
918920
You can’t perform that action at this time.
0 commit comments