vllm-project · njhill · Oct 23, 2025 · Oct 14, 2025 · Oct 22, 2025 · njhill
@@ -278,6 +278,7 @@ def schedule(self) -> SchedulerOutput:
                         token_budget += num_scheduled_tokens[preempted_req.request_id]
                         req_to_new_blocks.pop(preempted_req.request_id)
                         num_scheduled_tokens.pop(preempted_req.request_id)
+                        req_index -= 1
                 else:
                     preempted_req = self.running.pop()