Skip to content

Commit 6bfa066

Browse files
NickLucche authored and yangw-dev committed
[TPU][V1] Make --disable_chunked_mm_input mandatory for serving MM models (vllm-project#16483)
Signed-off-by: NickLucche <nlucches@redhat.com>
Signed-off-by: Yang Wang <elainewy@meta.com>
1 parent 35c6b47 commit 6bfa066

File tree

1 file changed

+7
-0
lines changed

1 file changed

+7
-0
lines changed

vllm/platforms/tpu.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -120,6 +120,13 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
120120
assert not vllm_config.speculative_config, (
121121
"Speculative decoding is not yet supported for TPU backend")
122122

123+
if scheduler_config.is_multimodal_model and not \
124+
scheduler_config.disable_chunked_mm_input:
125+
logger.warning("TPU does not support running Multimodal models"\
126+
" without setting `--disable_chunked_mm_input`. " \
127+
"Forcing --disable_chunked_mm_input.")
128+
scheduler_config.disable_chunked_mm_input = True
129+
123130
@classmethod
124131
def is_pin_memory_available(cls):
125132
logger.warning("Pin memory is not supported on TPU.")

0 commit comments

Comments
 (0)