From 78f8504a3c5ec80f00413d934feb6848bd3d866c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BC=80=E5=93=B2?= Date: Fri, 11 Apr 2025 17:36:47 +0800 Subject: [PATCH] Fix memory leak: clear finished entries from seq_id_to_seq_group when sampling param n>1 MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 开哲 --- vllm/outputs.py | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/vllm/outputs.py b/vllm/outputs.py index 014e8d5d8823..413f7c0eb653 100644 --- a/vllm/outputs.py +++ b/vllm/outputs.py @@ -173,6 +173,13 @@ def from_seq_group( group.finish_seq(seq_group) if assembled_seq_group is None: return None + + # clear finished seq in seq_id_to_seq_group + if len(group.to_be_finished) == 0: + for sub_request_id in list(group.seq_id_to_index.keys()): + if sub_request_id in seq_id_to_seq_group: + del seq_id_to_seq_group[sub_request_id] + return cls.from_seq_group(assembled_seq_group, use_cache, seq_id_to_seq_group)