We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3c1f724 commit ea8aca3 (Copy full SHA for ea8aca3)
lightllm/server/router/manager.py
@@ -291,6 +291,7 @@ async def _step(self):
291
new_mini_batch = self.req_queue.generate_new_batch(self.running_batch)
292
self.has_wait_tokens = 0
293
if new_mini_batch is not None:
294
+ self.has_wait_tokens = self.max_wait_tokens
295
self.stats_tool.count_prompt_tokens(new_mini_batch)
296
await self._prefill_batch(new_mini_batch)
297
if not new_mini_batch.is_clear():
0 commit comments