From c8c7d56e5008ec3c33f119f3d03c7f4f6bb5983d Mon Sep 17 00:00:00 2001 From: quanliu <18646313696@163.com> Date: Sun, 12 Oct 2025 22:09:45 +0800 Subject: [PATCH] [Bugfix][Core] Remove preempted_req from req_to_new_blocks and num_scheduled_tokens Signed-off-by: quanliu <18646313696@163.com> --- vllm/v1/core/sched/scheduler.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/vllm/v1/core/sched/scheduler.py b/vllm/v1/core/sched/scheduler.py index 0f1504724d7c..365d1b13a9bf 100644 --- a/vllm/v1/core/sched/scheduler.py +++ b/vllm/v1/core/sched/scheduler.py @@ -273,6 +273,9 @@ def schedule(self) -> SchedulerOutput: self.running.remove(preempted_req) if preempted_req in scheduled_running_reqs: scheduled_running_reqs.remove(preempted_req) + token_budget += num_scheduled_tokens[preempted_req.request_id] + req_to_new_blocks.pop(preempted_req.request_id) + num_scheduled_tokens.pop(preempted_req.request_id) else: preempted_req = self.running.pop()