Skip to content

Commit 63ac326

Browse files
committed
fix
1 parent 65b0770 commit 63ac326

File tree

2 files changed

+5
-24
lines changed

2 files changed

+5
-24
lines changed

lightllm/server/router/req_queue/base_queue.py

Lines changed: 0 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -26,11 +26,6 @@ def __init__(self, args, router, dp_index, dp_size_in_node) -> None:
2626
self.router_token_ratio = args.router_token_ratio # ratio to determine whether the router is busy
2727
self.router_max_new_token_len = args.router_max_new_token_len
2828

29-
def append(self, req: Req):
30-
req.sample_params.suggested_dp_index = self.dp_index
31-
self.waiting_req_list.append(req)
32-
return
33-
3429
def extend(self, req_group: List[Req]):
3530
for req in req_group:
3631
req.sample_params.suggested_dp_index = self.dp_index

lightllm/server/router/req_queue/dp_base_queue.py

Lines changed: 5 additions & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -32,16 +32,11 @@ def get_wait_req_num(self):
3232

3333
# @calculate_time(show=True, min_cost_ms=10)
3434
def generate_new_batch(self, current_batch: Batch):
35-
try:
36-
self.dp_balancer.assign_reqs_to_dp(current_batch, self.reqs_waiting_for_dp_index)
37-
batches = [
38-
self.inner_queues[dp_index].generate_new_batch(current_batch)
39-
for dp_index in range(self.dp_size_in_node)
40-
]
41-
return self._merge_batch(batches)
42-
except Exception as e:
43-
logger.error(f"generate new batch failed: {e}")
44-
raise e
35+
self.dp_balancer.assign_reqs_to_dp(current_batch, self.reqs_waiting_for_dp_index)
36+
batches = [
37+
self.inner_queues[dp_index].generate_new_batch(current_batch) for dp_index in range(self.dp_size_in_node)
38+
]
39+
return self._merge_batch(batches)
4540

4641
def _merge_batch(self, dp_batches: List[Batch]):
4742
merged_batch: Batch = None
@@ -52,15 +47,6 @@ def _merge_batch(self, dp_batches: List[Batch]):
5247
merged_batch = iter_batch
5348
return merged_batch
5449

55-
def append(self, req: Req):
56-
suggested_dp_index = req.sample_params.suggested_dp_index
57-
if suggested_dp_index >= self.dp_size_in_node or suggested_dp_index < 0:
58-
# 在调度时,统一分配请求id
59-
self.reqs_waiting_for_dp_index.append([req])
60-
else:
61-
self.inner_queues[suggested_dp_index].append(req)
62-
return
63-
6450
def extend(self, req_group: List[Req]):
6551
suggested_dp_index = req_group[0].sample_params.suggested_dp_index
6652
if suggested_dp_index >= self.dp_size_in_node or suggested_dp_index < 0:

0 commit comments

Comments
 (0)