We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1de0baa commit 46fb03d Copy full SHA for 46fb03d
lightllm/server/httpserver/pd_loop.py
@@ -197,7 +197,9 @@ def _get_load_info() -> dict:
197
198
# 获取当前每个 dp 的负载,数值含义为当前的 token 总容量使用率, 上报给 PD_Master 用于做
199
# 调度决策。
200
- current_load = [float(g_objs.shared_token_load.get_dynamic_max_load(dp_index)) for dp_index in dp_size_in_node]
+ current_load = [
201
+ float(g_objs.shared_token_load.get_dynamic_max_load(dp_index)) for dp_index in range(dp_size_in_node)
202
+ ]
203
mean_node_load = sum(current_load) / len(current_load)
204
load_info = {
205
"total_token_usage_rate": mean_node_load,
0 commit comments