File tree Expand file tree Collapse file tree 1 file changed +5
-2
lines changed Expand file tree Collapse file tree 1 file changed +5
-2
lines changed Original file line number Diff line number Diff line change 25
25
from vllm .attention .backends .abstract import (AttentionImpl , AttentionLayer ,
26
26
AttentionType )
27
27
from vllm .attention .backends .utils import PAD_SLOT_ID
28
+ from vllm .config import VllmConfig
28
29
from vllm .utils import cdiv
29
30
30
31
from vllm_ascend .attention .attention_v1 import (AscendAttentionBackend ,
@@ -97,8 +98,10 @@ class AscendTorchairMetadata(AscendMetadata):
97
98
98
99
class AscendAttentionTorchairMetadataBuilder (AscendAttentionMetadataBuilder ):
99
100
100
- def __init__ (self , runner ):
101
- super ().__init__ (runner )
101
+ def __init__ (self ,
102
+ vllm_config : VllmConfig ,
103
+ device : torch .device ,):
104
+ super ().__init__ (vllm_config , device )
102
105
self .max_num_blocks_per_req = cdiv (
103
106
self .model_config .max_model_len ,
104
107
self .vllm_config .cache_config .block_size )
You can’t perform that action at this time.
0 commit comments