Skip to content

Commit 2702184

Browse files
author
wangzaijun
committed
fix
1 parent fccac43 commit 2702184

File tree

1 file changed

+1
-35
lines changed

1 file changed

+1
-35
lines changed

lightllm/server/httpserver/pd_loop.py

Lines changed: 1 addition & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,6 @@
55
import socket
66
import httpx
77
import base64
8-
import zmq
98
from typing import Dict, Optional
109
from lightllm.server.pd_io_struct import NodeRole, ObjType
1110
from lightllm.server.httpserver.async_queue import AsyncQueue
@@ -34,8 +33,6 @@ async def pd_handle_loop(manager: HttpServerManager):
3433
manager.host_ip = manager.args.host
3534

3635
asyncio.create_task(timer_log(manager))
37-
if manager.pd_mode.is_NP_or_ND():
38-
asyncio.create_task(pd_handle_loop_from_d(manager))
3936

4037
id_to_handle_task: Dict[int, asyncio.Task] = {}
4138

@@ -95,8 +92,7 @@ async def _pd_handle_task(manager: HttpServerManager, pd_master_obj: PD_Master_O
9592
logger.info(f"Sent registration JSON: {regist_json}")
9693

9794
# 转发任务
98-
if manager.pd_mode != NodeRole.NP: # nixl prefill don't need up token to master
99-
forwarding_tokens_task = asyncio.create_task(_up_tokens_to_pd_master(forwarding_queue, websocket))
95+
forwarding_tokens_task = asyncio.create_task(_up_tokens_to_pd_master(forwarding_queue, websocket))
10096

10197
# 接收 pd master 发来的请求,并推理后,将生成的token转发回pd master。
10298
while True:
@@ -210,33 +206,3 @@ def _get_load_info() -> dict:
210206
"client_ip_port": f"{g_objs.httpserver_manager.host_ip}:{g_objs.args.port}",
211207
}
212208
return load_info
213-
214-
215-
async def pd_handle_loop_from_d(manager: HttpServerManager):
216-
if manager.pd_mode != NodeRole.NP:
217-
return
218-
219-
context = zmq.asyncio.Context(2)
220-
manager.recv_from_d = context.socket(zmq.PULL)
221-
manager.recv_from_d.bind(f"tcp://*:{manager.args.pd_nixl_remote_prefill_http_port}")
222-
223-
while True:
224-
try:
225-
(
226-
prompt,
227-
sampling_params,
228-
multimodal_params,
229-
) = await manager.recv_from_d.recv_pyobj()
230-
231-
# 触发推理的task
232-
async def pd_process_generate(manager: "HttpServerManager", prompt, sampling_params, multimodal_params):
233-
try:
234-
async for _, _, _, _ in manager.generate(prompt, sampling_params, multimodal_params, None):
235-
pass
236-
except BaseException as e:
237-
logger.error(str(e))
238-
239-
asyncio.create_task(pd_process_generate(manager, prompt, sampling_params, multimodal_params))
240-
241-
except Exception as e:
242-
logger.exception(f"pd loop generate error: {str(e)}")

0 commit comments

Comments
 (0)