Skip to content

Commit 64bdc11

Browse files
committed
update mem_manager
1 parent 249dea7 commit 64bdc11

File tree

2 files changed

+10
-7
lines changed

2 files changed

+10
-7
lines changed

lightllm/common/mem_manager.py

Lines changed: 9 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -300,12 +300,15 @@ class ReadOnlyStaticsMemoryManager:
300 300
读取一些统计信息
301 301
"""
302 302

303-
def __init__(self, global_world_size) -> None:
304-
self.gobal_world_size = global_world_size
305-
self.shared_tp_infos = [
306-
SharedInt(f"{get_unique_server_name()}_mem_manger_can_use_token_num_{rank}")
307-
for rank in range(global_world_size)
308-
]
303+
def __init__(self) -> None:
304+
args = get_env_start_args()
305+
node_world_size = args.tp // args.nnodes
306+
rank_start = args.node_rank * node_world_size
307+
rank_end = (args.node_rank + 1) * node_world_size
308+
self.shared_tp_infos = {
309+
rank: SharedInt(f"{get_unique_server_name()}_mem_manger_can_use_token_num_{rank}")
310+
for rank in range(rank_start, rank_end)
311+
}
309 312

310 313
def get_unrefed_token_num(self, dp_rank: int):
311 314
args = get_env_start_args()

lightllm/server/router/manager.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -51,7 +51,7 @@ def __init__(self, args, router_port, detokenization_port, model_rpc_ports, metr
51 51
self.max_total_token_num = args.max_total_token_num
52 52
self.shm_req_manager = ShmReqManager()
53 53
# 用共享内存进行共享,router 模块读取进行精确的调度估计
54-
self.read_only_statics_mem_manager = ReadOnlyStaticsMemoryManager(self.world_size)
54+
self.read_only_statics_mem_manager = ReadOnlyStaticsMemoryManager()
55 55
# 初始化 radix_cache_client 用于读取 prompt cache 的管理信息
56 56
self.radix_cache_client = None
57 57

0 commit comments

Comments
 (0)