Skip to content

Commit 0795d72

Browse files
committed
write mem manager to shm
1 parent 7eef57f commit 0795d72

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

lightllm/server/router/model_infer/mode_backend/base_backend.py

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -218,6 +218,14 @@ def init_model(self, kvargs):
218218
if self.args.mtp_mode:
219219
self.init_mtp_draft_model(kvargs)
220220

221+
# 如果存在需要跨进程使用 mem manager 的特性,则将 mem manager 写入到 shm 中,方便
222+
# 读取
223+
if (
224+
self.args.run_mode in ["nixl_prefill", "nixl_decode", "prefill", "decode"]
225+
or self.args.enable_dp_prompt_cache_fetch
226+
):
227+
self.model.mem_manager.write_to_shm()
228+
221229
# 启动infer_loop_thread, 启动两个线程进行推理,对于具备双batch推理折叠的场景
222230
# 可以降低 cpu overhead,大幅提升gpu的使用率。
223231
self.infer_loop_thread = threading.Thread(target=self.infer_loop, daemon=True)

0 commit comments

Comments
 (0)