File tree Expand file tree Collapse file tree 2 files changed: +2 -11 lines changed
lightllm/server/router/model_infer
mode_backend/continues_batch/pd_mode/decode_node_impl
Expand file tree Collapse file tree 2 files changed: +2 -11 lines changed
Original file line number | Diff line number | Diff line change
@@ -49,16 +49,7 @@ def init_custom(self):
49 49 return
50 50
51 51 def prefill(self, reqs: List[Tuple]):
52 - # 当 dp_size 不等于 1 的时候,需要提前从发来的请求参数中
53 - # 剔除掉不需要处理的请求参数, deepseekv2 这种特殊的模型
54 - # 在 dp 模式下 tp_rank == dp_rank
55 - if self.dp_size != 1:
56 - cur_dp_index = self.tp_rank
57 - reqs = [req for req in reqs if req[3] == cur_dp_index]
58 -
59 - g_infer_state_lock.acquire()
60 - g_infer_context.add_reqs(reqs, init_req_obj=False) # 请求对象进行延迟初始化
61 - g_infer_state_lock.release()
52 + self._init_reqs(reqs, init_req_obj=False)
62 53 return
63 54
64 55 def decode(self):
Original file line number | Diff line number | Diff line change
@@ -305,7 +305,7 @@ async def start_model_process(
305 305 ):
306 306 import lightllm.utils.rpyc_fix_utils as _
307 307
308 - # 单卡时不使用 rpc
308 + # 单卡单机时不使用 rpc
309 309 if node_world_size == 1 and args.nnodes == 1:
310 310 return ModelRpcServer(
311 311 args,
You can’t perform that action at this time.
0 commit comments