diff --git a/python/ray/llm/_internal/batch/stages/vllm_engine_stage.py b/python/ray/llm/_internal/batch/stages/vllm_engine_stage.py index f5fad0aaa91e..cc9ee2d07e7f 100644 --- a/python/ray/llm/_internal/batch/stages/vllm_engine_stage.py +++ b/python/ray/llm/_internal/batch/stages/vllm_engine_stage.py @@ -275,9 +275,6 @@ async def _prepare_llm_request(self, row: Dict[str, Any]) -> vLLMEngineRequest: if self.task_type == vLLMTaskType.GENERATE: sampling_params = row.pop("sampling_params") if "guided_decoding" in sampling_params: - if self.vllm_use_v1: - raise ValueError("Guided decoding is only supported with vLLM v0") - guided_decoding = vllm.sampling_params.GuidedDecodingParams( **maybe_convert_ndarray_to_list( sampling_params.pop("guided_decoding")