We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e5af904, commit 2019b7a (Copy full SHA for 2019b7a)
lightllm/server/router/model_infer/mode_backend/dp_backend/control_state.py
@@ -95,6 +95,7 @@ def _normal_way(
95
if self.dp_prefill_wait_step > self.dp_prefill_wait_max_step:
96
# prefill 一次允许进行几次 decode 操作。
97
self.left_decode_num = self.decode_max_step
98
+ self.dp_prefill_wait_step = max(0, (self.dp_prefill_wait_step - self.decode_max_step))
99
return RunWay.PREFILL
100
101
if max_decode_num > 0:
0 commit comments