Skip to content

Commit fb1c40b

Browse files
committed
修复 decode 节点 init req 代码重复。
1 parent 46d0b13 commit fb1c40b

File tree

2 files changed

+2
-11
lines changed

2 files changed

+2
-11
lines changed

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/decode_node_impl/decode_impl.py

Lines changed: 1 addition & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -49,16 +49,7 @@ def init_custom(self):
4949
return
5050

5151
def prefill(self, reqs: List[Tuple]):
52-
# 当 dp_size 不等于 1 的时候,需要提前从发来的请求参数中
53-
# 剔除掉不需要处理的请求参数, deepseekv2 这种特殊的模型
54-
# 在 dp 模式下 tp_rank == dp_rank
55-
if self.dp_size != 1:
56-
cur_dp_index = self.tp_rank
57-
reqs = [req for req in reqs if req[3] == cur_dp_index]
58-
59-
g_infer_state_lock.acquire()
60-
g_infer_context.add_reqs(reqs, init_req_obj=False) # 请求对象进行延迟初始化
61-
g_infer_state_lock.release()
52+
self._init_reqs(reqs, init_req_obj=False)
6253
return
6354

6455
def decode(self):

lightllm/server/router/model_infer/model_rpc.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -305,7 +305,7 @@ async def start_model_process(
305305
):
306306
import lightllm.utils.rpyc_fix_utils as _
307307

308-
# 单卡时不使用 rpc
308+
# 单卡单机时不使用 rpc
309309
if node_world_size == 1 and args.nnodes == 1:
310310
return ModelRpcServer(
311311
args,

0 commit comments

Comments
 (0)