Skip to content

Commit 6ef4dcd

Browse files
committed
fix first version
1 parent df1d500 commit 6ef4dcd

File tree

1 file changed

+14
-15
lines changed

1 file changed

+14
-15
lines changed

lightllm/server/router/model_infer/mode_backend/multi_level_kv_cache.py

Lines changed: 14 additions & 15 deletions
Original file line number | Diff line number | Diff line change
@@ -50,23 +50,22 @@ def handle_finished_reqs(self, finished_reqs: List[InferReq]) -> List[InferReq]:
5050
# 如果请求已经完成了 cpu cache 的任务,则满足了退出条件
5151
if req.cpu_cache_task_status.is_finished():
5252
true_finished_reqs.append(req)
53+
elif req.cpu_cache_task_status.is_running():
54+
# 如果请求已经发起过卸载任务,则在当前轮不进行处理
5355
continue
54-
55-
# 如果请求已经发起过卸载任务,则在当前轮不进行处理
56-
if req.cpu_cache_task_status.is_running():
57-
continue
58-
59-
# 发起将请求的 kv cache 卸载到 cpu cache 中的任务
60-
trans_task = self._start_kv_cache_offload_task(
61-
req=req, cpu_kv_cache_stream=g_infer_context.get_cpu_kv_cache_stream()
62-
)
63-
64-
if trans_task is not None:
65-
self.cpu_cache_handle_queue.append(trans_task)
6656
else:
67-
true_finished_reqs.append(req)
68-
69-
return true_finished_reqs
57+
assert req.cpu_cache_task_status.is_not_started()
58+
# 发起将请求的 kv cache 卸载到 cpu cache 中的任务
59+
trans_task = self._start_kv_cache_offload_task(
60+
req=req, cpu_kv_cache_stream=g_infer_context.get_cpu_kv_cache_stream()
61+
)
62+
63+
if trans_task is not None:
64+
self.cpu_cache_handle_queue.append(trans_task)
65+
else:
66+
true_finished_reqs.append(req)
67+
68+
return true_finished_reqs
7069
else:
7170
return finished_reqs
7271

0 commit comments

Comments
 (0)