Skip to content

Commit 3733339

Browse files
committed
move seed check to platform specific validate
Signed-off-by: NickLucche <nlucches@redhat.com>
1 parent 42aaca7 commit 3733339

File tree

2 files changed

+4
-6
lines changed

2 files changed

+4
-6
lines changed

vllm/platforms/tpu.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
 import vllm.envs as envs
 from vllm.inputs import PromptType
 from vllm.logger import init_logger
-from vllm.sampling_params import SamplingParams
+from vllm.sampling_params import SamplingParams, SamplingType

 from .interface import Platform, PlatformEnum, _Backend

@@ -149,3 +149,5 @@ def validate_request(
                 SamplingParams) and params.guided_decoding is not None:
             raise ValueError("Structured output is not supported on "
                              f"{cls.device_name}.")
+        if params.sampling_type == SamplingType.RANDOM_SEED:
+            raise ValueError("Torch XLA does not support per-request seed.")

vllm/v1/engine/processor.py

Lines changed: 1 addition & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,9 @@
 from vllm.multimodal.inputs import PlaceholderRange
 from vllm.multimodal.processing import EncDecMultiModalProcessor
 from vllm.multimodal.utils import merge_and_sort_multimodal_metadata
-from vllm.platforms import current_platform
 from vllm.pooling_params import PoolingParams
 from vllm.prompt_adapter.request import PromptAdapterRequest
-from vllm.sampling_params import SamplingParams, SamplingType
+from vllm.sampling_params import SamplingParams
 from vllm.transformers_utils.tokenizer_group import BaseTokenizerGroup
 from vllm.v1.engine import EngineCoreRequest
 from vllm.v1.engine.mm_input_cache import MirroredProcessingCache
@@ -78,9 +77,6 @@ def _validate_sampling_params(
         params: SamplingParams,
     ) -> None:
         self._validate_structured_output(params)
-        if (current_platform.is_tpu()
-                and params.sampling_type == SamplingType.RANDOM_SEED):
-            raise ValueError("Torch XLA does not support per-request seed.")

         if params.allowed_token_ids is None:
             return

0 commit comments

Comments
 (0)