We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent eac2b60, commit 396d5e6 (Copy full SHA for 396d5e6)
lightllm/common/basemodel/infer_struct.py
@@ -27,6 +27,9 @@ def __init__(self):
27
self.max_len_in_batch: int = None
28
# max_cache_len: used in the prefill stage to record the maximum cached KV length among the requests
29
self.max_cache_len: int = None
30
+ # prefix_total_token_num: used in the prefill stage to record the summed length of all
31
+ # already-ready KV entries in the current requests; its value equals sum(b_ready_cache_len)
32
+ self.prefix_total_token_num: int = None
33
self.is_prefill: bool = None
34
35
self.mem_manager: MemoryManager = None
0 commit comments