Skip to content

Commit 7888e1d

Browse files
authored
[V1] TPU - Enable prefix caching by default (#14773)
1 parent 60c872d commit 7888e1d

File tree

1 file changed

+0
-6
lines changed

1 file changed

+0
-6
lines changed

vllm/platforms/tpu.py

Lines changed: 0 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -108,12 +108,6 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
108 108    parallel_config.worker_cls = \
109 109        "vllm.worker.tpu_worker.TPUWorker"
110 110
111     -  # Adjust scheduler config for V1
112     -  # TODO: Add support for these
113     -  if envs.VLLM_USE_V1 and vllm_config.cache_config.enable_prefix_caching:
114     -      logger.warning("[V1][TPU] Disable prefix caching")
115     -      vllm_config.cache_config.enable_prefix_caching = False
116     -
117 111    assert not vllm_config.speculative_config, (
118 112        "Speculative decoding is not yet supported for TPU backend")
119 113

0 commit comments

Comments
 (0)