Skip to content

Commit 7b7f85e

Browse files
author
wangzaijun
committed
fix
1 parent f23113f commit 7b7f85e

File tree

2 files changed

+17
-0
lines changed

2 files changed

+17
-0
lines changed

lightllm/server/router/dynamic_prompt/radix_cache.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -333,6 +333,18 @@ def add_node_ref_counter(self, node: TreeNode):
333333
self.evict_tree_set.add(old_node)
334334
return
335335

336+
def get_mem_index_value_by_node(self, node: TreeNode) -> Optional[torch.Tensor]:
    """Concatenate ``token_mem_index_value`` along the ancestor chain of *node*.

    Starting at *node*, follow ``parent`` links until a node whose parent is
    ``None`` has been visited, gathering each visited node's
    ``token_mem_index_value``. The gathered tensors are joined along
    dimension 0 with the topmost ancestor's values first and *node*'s own
    values last.

    Args:
        node: The node whose ancestor chain should be flattened, or ``None``.

    Returns:
        ``None`` when *node* is ``None``; otherwise a single tensor holding
        the concatenated values.
    """
    if node is None:
        return None

    # Gathered bottom-up (node first, topmost ancestor last).
    segments = []
    cursor = node
    while cursor is not None:
        segments.append(cursor.token_mem_index_value)
        cursor = cursor.parent

    # Flip to top-down order before joining.
    return torch.concat(segments[::-1], dim=0)
347+
336348
def get_refed_tokens_num(self):
337349
return self.refed_tokens_num.arr[0]
338350

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl/prefill_impl.py

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -85,6 +85,11 @@ def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(self, finished_reqs:
8585
self.radix_cache.add_node_ref_counter(new_shared_kv_node)
8686
req.shared_kv_node = new_shared_kv_node
8787

88+
_kv_len = req.cur_kv_len
89+
_value = self.radix_cache.get_mem_index_value_by_node(new_shared_kv_node)
90+
assert len(_value) == _kv_len
91+
self.model.req_manager.req_to_token_indexs[req.req_idx][0:_kv_len] = _value
92+
8893
assert new_shared_kv_node.node_prefix_total_len == req.cur_kv_len
8994

9095
if req.shm_req.sample_params.move_kv_to_decode_node.exists:

0 commit comments

Comments
 (0)