We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 60c872d, commit 7888e1d. Copy full SHA for 7888e1d
vllm/platforms/tpu.py
@@ -108,12 +108,6 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
108
parallel_config.worker_cls = \
109
"vllm.worker.tpu_worker.TPUWorker"
110
111
- # Adjust scheduler config for V1
112
- # TODO: Add support for these
113
- if envs.VLLM_USE_V1 and vllm_config.cache_config.enable_prefix_caching:
114
- logger.warning("[V1][TPU] Disable prefix caching")
115
- vllm_config.cache_config.enable_prefix_caching = False
116
-
117
assert not vllm_config.speculative_config, (
118
"Speculative decoding is not yet supported for TPU backend")
119
0 commit comments