Skip to content

Commit 66e95c6

Browse files
committed
refactor attn metadata build
Signed-off-by: weiguihua2 <[email protected]>
1 parent 511de2f commit 66e95c6

File tree

2 files changed

+3
-4
lines changed

2 files changed

+3
-4
lines changed

vllm_ascend/attention/utils.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
from dataclasses import dataclass
2-
from typing import Any
2+
from typing import Any, Optional
33

44
import torch
55

@@ -36,7 +36,7 @@ class AscendCommonAttentionMetadata:
3636

3737
slot_mapping_cpu: torch.Tensor
3838

39-
actual_seq_lengths_q: list[int] = None
39+
actual_seq_lengths_q: Optional[list[int]] = None
4040

4141
positions: torch.Tensor = None
4242

@@ -70,7 +70,7 @@ class TorchairCommonAttentionMetadata:
7070

7171
decode_token_per_req: int
7272

73-
actual_seq_lengths_q: list[int] = None
73+
actual_seq_lengths_q: Optional[list[int]] = None
7474

7575
attn_mask: torch.Tensor = None
7676

vllm_ascend/worker/model_runner_v1.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -812,7 +812,6 @@ def get_eagle_atten_dict(
812812
attn_mask=self.attn_mask,
813813
spec_attn_mask=self.spec_attn_mask,
814814
attn_state=self.attn_state,
815-
max_num_blocks_per_req=self.max_num_blocks_per_req,
816815
decode_token_per_req=self.decode_token_per_req,
817816
)
818817
attn_metadata_i = self.attn_metadata_builder.build(

0 commit comments

Comments
 (0)