diff --git a/vllm/engine/multiprocessing/engine.py b/vllm/engine/multiprocessing/engine.py index ac234d25373d..1c5972984711 100644 --- a/vllm/engine/multiprocessing/engine.py +++ b/vllm/engine/multiprocessing/engine.py @@ -229,8 +229,8 @@ def engine_step(self) -> List[RequestOutput]: """Engine step wrapper with error handling.""" try: return self.engine.step() - except SystemExit: - raise + except SystemExit as e: + raise e from None except InputProcessingError as e: # Special case where we handle an error preparing the inputs for # a single request in the batch @@ -245,7 +245,7 @@ def engine_step(self) -> List[RequestOutput]: is_engine_errored=True, exception=e) self._send_outputs(rpc_err) - raise e + raise e from None def handle_new_input(self): """Handle new input from the socket"""