Skip to content

Commit 8a82ac4

Browse files
committed
bugfix: skip cancelled requests when processing stream output. (#289)
1 parent cda8541 commit 8a82ac4

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

xllm/core/scheduler/continuous_scheduler.cpp

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1025,8 +1025,13 @@ void ContinuousScheduler::process_batch_output(bool enable_schedule_overlap) {
10251025
for (auto request : to_be_processed_requests) {
10261026
// ignore cancelled/finished requests when schedule overlap is enabled.
10271027
if (options_.enable_schedule_overlap() && request->state().stream) {
1028-
if (!request->finished() && !request->cancelled()) {
1028+
// skip cancelled request
1029+
if (request->cancelled()) {
1030+
continue;
1031+
}
1032+
if (!request->finished()) {
10291033
stream_requests.emplace_back(request);
1034+
continue;
10301035
}
10311036
// handle the last token if it has not been handled yet.
10321037
if (request->finished() && !request->last_token_handled()) {

0 commit comments

Comments
 (0)