Skip to content

Commit b52daf0

Browse files
committed
Move block_size to the first parameter of copy_kv_blocks and update its callers
1 parent d015bbe commit b52daf0

File tree

2 files changed

+5
-5
lines changed

2 files changed

+5
-5
lines changed

vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1009,8 +1009,8 @@ def sync_recved_kv_to_device(self, req_id: str, meta: ReqMeta):
10091009
assert self.copy_blocks is not None
10101010

10111011
local_block_ids = meta.local_block_ids
1012-
self.copy_blocks(self.host_xfer_buffers, self.device_kv_caches,
1013-
local_block_ids, local_block_ids, "h2d", self.block_size)
1012+
self.copy_blocks(self.block_size, self.host_xfer_buffers, self.device_kv_caches,
1013+
local_block_ids, local_block_ids, "h2d")
10141014
if logger.isEnabledFor(logging.DEBUG):
10151015
logger.debug(
10161016
"synced recved kv of request[%s] to device kv buffer,"
@@ -1029,8 +1029,8 @@ def save_kv_to_host(self, metadata: NixlConnectorMetadata):
10291029
"local_block_ids: %s. ", req_id,
10301030
",".join(map(str, meta.local_block_ids)))
10311031
# blocking
1032-
self.copy_blocks(self.device_kv_caches, self.host_xfer_buffers,
1033-
meta.local_block_ids, meta.local_block_ids, "d2h", self.block_size)
1032+
self.copy_blocks(self.block_size, self.device_kv_caches, self.host_xfer_buffers,
1033+
meta.local_block_ids, meta.local_block_ids, "d2h")
10341034

10351035
def get_finished(self) -> tuple[set[str], set[str]]:
10361036
"""

vllm/v1/worker/hpu_model_runner.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2515,12 +2515,12 @@ def _swap_out_hpu_blocks(
25152515
cpu_cache[cpu_block_indices] = hpu_cache[hpu_block_indices].cpu()
25162516

25172517
def copy_kv_blocks(
2518+
block_size: int,
25182519
src_kv_caches: dict[str, torch.Tensor],
25192520
dst_kv_caches: dict[str, torch.Tensor],
25202521
src_block_ids: list[int],
25212522
dst_block_ids: list[int],
25222523
direction: Literal["h2d", "d2h"],
2523-
block_size: int
25242524
) -> None:
25252525
"""Copy kv blocks between different buffers."""
25262526
if not src_kv_caches or not dst_kv_caches or \

0 commit comments

Comments
 (0)