We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9c62060 commit 50a3a08 (Copy full SHA for 50a3a08)
xllm/core/scheduler/continuous_scheduler.cpp
@@ -1019,8 +1019,13 @@ void ContinuousScheduler::process_batch_output(bool enable_schedule_overlap) {
1019
for (auto request : to_be_processed_requests) {
1020
// ignore cancelled/finished requests when enable_schedule_overlap is set.
1021
if (options_.enable_schedule_overlap() && request->state().stream) {
1022
- if (!request->finished() && !request->cancelled()) {
+ // skip cancelled request
1023
+ if (request->cancelled()) {
1024
+ continue;
1025
+ }
1026
+ if (!request->finished()) {
1027
stream_requests.emplace_back(request);
1028
1029
}
1030
// handle the last token if it has not been handled yet.
1031
if (request->finished() && !request->last_token_handled()) {
0 commit comments