We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 71018fb · commit b88537a · Copy full SHA for b88537a
fastdeploy/output/token_processor.py
@@ -329,8 +329,9 @@ def _process_batch_output(self):
 if recovery_stop:
     llm_logger.info(f"recovery stop signal found at task {task_id}")
 if not recovery_stop and token_id < 0:
-    if task_id in self.resource_manager.to_be_rescheduled_request_id_set:
-        self.resource_manager.reschedule_preempt_task(task_id)
+    if envs.ENABLE_V1_KVCACHE_SCHEDULER:
+        if task_id in self.resource_manager.to_be_rescheduled_request_id_set:
+            self.resource_manager.reschedule_preempt_task(task_id)
     continue

 if task.get("prefill_chunk_info", None) is not None:
0 commit comments