Skip to content

Commit 65acff2

Browse files
Update hpu_model_runner.py
1 parent f6d0f6a commit 65acff2

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm/v1/worker/hpu_model_runner.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -573,10 +573,11 @@ def __init__(
573 573   self.input_batch = InputBatch(
574 574   max_num_reqs=self.scheduler_config.max_num_seqs,
575 575   max_model_len=self.max_model_len,
576     - max_num_blocks_per_req=self.max_num_blocks_per_req,
    576 + max_num_batched_tokens=self.max_num_tokens,
577 577   device=self.device,
578 578   pin_memory=self.pin_memory,
579 579   vocab_size=self.model_config.get_vocab_size(),
    580 + block_sizes=[self.block_size]
580 581   )
581 582   self.mem_margin = None
582 583

0 commit comments

Comments
 (0)