From 9c10ff7ea732a1e0ea216cedce799f796784f2c1 Mon Sep 17 00:00:00 2001
From: Nick Hill
Date: Fri, 5 Sep 2025 16:49:45 -0700
Subject: [PATCH] [Bugfix] Catch and log invalid token ids in detokenizer

Signed-off-by: Nick Hill
---
 vllm/v1/engine/detokenizer.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/vllm/v1/engine/detokenizer.py b/vllm/v1/engine/detokenizer.py
index 0ccbe6549349..38f435f5166e 100644
--- a/vllm/v1/engine/detokenizer.py
+++ b/vllm/v1/engine/detokenizer.py
@@ -233,6 +233,11 @@ def decode_next(self, next_token_id: int) -> str:
     def _protected_step(self, next_token_id: int) -> Optional[str]:
         try:
             token = self.stream.step(self.tokenizer, next_token_id)
+        except OverflowError:
+            # Handle rare observed overflow, still to be diagnosed.
+            # See https://github.com/vllm-project/vllm/issues/21951.
+            logger.exception("Encountered invalid token id: %d", next_token_id)
+            token = None
         except Exception as e:
             if not str(e).startswith(INVALID_PREFIX_ERR_MSG):
                 raise e