Skip to content

Commit 4e09ac5

Browse files
committed
refactor attn metadata build
Signed-off-by: weiguihua2 <[email protected]>
1 parent 908df33 commit 4e09ac5

File tree

3 files changed

+3
-5
lines changed

3 files changed

+3
-5
lines changed

vllm_ascend/attention/mla_v1.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -287,8 +287,7 @@ def build_torchair_graph_dummy(
         self, common_attn_metadata: AscendCommonAttentionMetadata,) -> AscendMLAMetadata:
         device = self.device
         num_reqs = common_attn_metadata.num_reqs
-        _, max_blocks = self.max_blocks
-        block_table = torch.zeros((num_reqs, max_blocks),
+        block_table = torch.zeros((num_reqs, self.max_blocks),
                                   dtype=torch.int32,
                                   device=device)
         block_table = self._get_graph_runner_block_tables(

vllm_ascend/torchair/torchair_attention.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -120,8 +120,7 @@ def build_torchair_graph_dummy(
         self, common_attn_metadata: AscendCommonAttentionMetadata) -> AscendTorchairMetadata:
         device = self.device
         num_reqs = common_attn_metadata.num_reqs
-        _, max_blocks = self.max_blocks
-        block_table = torch.zeros((num_reqs, max_blocks),
+        block_table = torch.zeros((num_reqs, self.max_blocks),
                                   dtype=torch.int32,
                                   device=device)
         block_table = self._get_graph_runner_block_tables(

vllm_ascend/torchair/torchair_model_runner.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -78,7 +78,7 @@ def _build_attention_metadata(self, with_prefill, num_reqs, skip_attn):
                     actual_seq_lengths_q=self.actual_seq_lengths_q,
                     attn_mask=self.attn_mask,
                     spec_attn_mask=self.spec_attn_mask,
-                    attn_state=self.attn_state,
+                    decode_token_per_req=self.decode_token_per_req,
                 )
                 attn_metadata = self.attn_metadata_builder.build_torchair_graph_dummy(common_attn_metadata)
             else:

0 commit comments

Comments
 (0)