We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3626756 commit 79fcc13 Copy full SHA for 79fcc13
lightllm/server/api_start.py
@@ -95,6 +95,10 @@ def normal_or_p_d_start(args):
95
if args.use_dynamic_prompt_cache:
96
assert args.token_healing_mode is False
97
98
+ # chunked prefill 需要和 dynamic_prompt_cache 一起使能
99
+ if not args.disable_chunked_prefill:
100
+ assert args.use_dynamic_prompt_cache is True
101
+
102
# 部分模式还不能支持与高级动态调度算法协同,to do.
103
if args.diverse_mode:
104
assert args.router_token_ratio == 0.0
0 commit comments