Skip to content

Commit e1cef4e

Browse files
committed
refact mla 1
Signed-off-by: whx-sjtu <[email protected]>
1 parent 103654c commit e1cef4e

File tree

3 files changed: 116 additions and 241 deletions.

vllm_ascend/ascend_config.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,9 @@ def __init__(self, vllm_config):
         self.enable_shared_expert_dp = additional_config.get(
             "enable_shared_expert_dp", True
         ) and not self.torchair_graph_config.enabled and vllm_config.parallel_config.enable_expert_parallel
+        self.enable_mla_prefetch = additional_config.get(
+            "enable_mla_prefetch", True
+        )
 
 
 class TorchairGraphConfig:

0 commit comments

Comments
 (0)