Skip to content

Commit 396d5e6

Browse files
author
wangzaijun
committed
fix
1 parent eac2b60 commit 396d5e6

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

lightllm/common/basemodel/infer_struct.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,9 @@ def __init__(self):
2727
self.max_len_in_batch: int = None
2828
# max_cache_len: used in the prefill stage; the largest cached KV length among the requests
2929
self.max_cache_len: int = None
30+
# prefix_total_token_num: used in the prefill stage; the total length of the KV that is
31+
# already ready across the current requests, i.e. it equals sum(b_ready_cache_len)
32+
self.prefix_total_token_num: int = None
3033
self.is_prefill: bool = None
3134

3235
self.mem_manager: MemoryManager = None

0 commit comments

Comments
 (0)