Skip to content

Commit d038f96

Browse files
author
root
committed
update
1 parent 2dae795 commit d038f96

File tree

2 files changed

+7
-2
lines changed

2 files changed

+7
-2
lines changed

lightllm/server/router/manager.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -397,7 +397,9 @@ def _add_req(self, group_req_indexes: GroupReqIndexes):
397397

398398
def _generate_new_batch(self):
399399
# 调度的时候需要考虑当前运行的batch,和调度了但是暂时还没有推理的部分请求。
400-
new_batch = self.req_queue.generate_new_batch(self.schedule_new_batch)
400+
new_batch = self.req_queue.generate_new_batch(
401+
Batch.merge_two_batch(self.running_batch, self.schedule_new_batch)
402+
)
401403
self.schedule_new_batch = Batch.merge_two_batch(self.schedule_new_batch, new_batch)
402404
return
403405

lightllm/server/router/req_queue/dp_balancer/dp_base_balancer.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,6 @@ class DpBalancer(ABC):
1717
def __init__(self, dp_size_in_node: int, inner_queues: List[BaseQueue]):
1818
self.dp_size_in_node = dp_size_in_node
1919
self.inner_queues = inner_queues
20-
self.pre_select_dp_index = self.dp_size_in_node - 1
2120

2221
@abstractmethod
2322
def assign_reqs_to_dp(self, current_batch: Batch, reqs_waiting_for_dp_index: List[Union[Req, List[Req]]]) -> None:
@@ -30,6 +29,10 @@ class RoundRobinDpBalancer(DpBalancer):
3029
在队列长度最小的DP中进行轮询选择
3130
"""
3231

32+
def __init__(self, dp_size_in_node: int, inner_queues: List[BaseQueue]):
33+
super().__init__(dp_size_in_node, inner_queues)
34+
self.pre_select_dp_index = self.dp_size_in_node - 1
35+
3336
def get_suggest_dp_index(
3437
self,
3538
) -> int:

0 commit comments

Comments
 (0)