We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d890c3c · commit 6aab772 · Copy full SHA for 6aab772
vllm/v1/core/sched/scheduler.py
@@ -271,6 +271,9 @@ def schedule(self) -> SchedulerOutput:
271
self.running.remove(preempted_req)
272
if preempted_req in scheduled_running_reqs:
273
scheduled_running_reqs.remove(preempted_req)
274
+ token_budget += num_scheduled_tokens[preempted_req.request_id]
275
+ req_to_new_blocks.pop(preempted_req.request_id)
276
+ num_scheduled_tokens.pop(preempted_req.request_id)
277
else:
278
preempted_req = self.running.pop()
279
0 commit comments