We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 5fb197a commit 1ae8541 (Copy full SHA for 1ae8541)
lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py
@@ -40,8 +40,12 @@ def __init__(self) -> None:
40
41
# 在 mtp 模式下切换绑定的prefill 和 decode 函数
42
if get_env_start_args().mtp_mode:
43
- self.prefill = self.prefill_mtp_eagle
44
- self.decode = self.decode_mtp_eagle
+ if get_env_start_args().mtp_mode == "deepseekv3_eagle":
+ self.prefill = self.prefill_mtp_eagle
45
+ self.decode = self.decode_mtp_eagle
46
+ else:
47
+ self.prefill = self.prefill_mtp_vanilla
48
+ self.decode = self.decode_mtp_vanilla
49
else:
50
self.prefill = self.prefill_normal
51
self.decode = self.decode_normal
0 commit comments