Skip to content

Commit 79fcc13

Browse files
authored
chunked prefill must enable prompt cache. (#800)
1 parent 3626756 commit 79fcc13

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

lightllm/server/api_start.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -95,6 +95,10 @@ def normal_or_p_d_start(args):
9595
if args.use_dynamic_prompt_cache:
9696
assert args.token_healing_mode is False
9797

98+
# chunked prefill 需要和 dynamic_prompt_cache 一起使能
99+
if not args.disable_chunked_prefill:
100+
assert args.use_dynamic_prompt_cache is True
101+
98102
# 部分模式还不能支持与高级动态调度算法协同,to do.
99103
if args.diverse_mode:
100104
assert args.router_token_ratio == 0.0

0 commit comments

Comments
 (0)