Skip to content

Commit ad0012a

Browse files
Revert "[Bugfix] Fix MRoPE Errors in the Qwen-VL Model When Processing Pure Text (vllm-project#18407)" (vllm-project#18456)
Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
1 parent: 92247c5 · commit: ad0012a

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

vllm/worker/model_runner.py

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -729,6 +729,8 @@ def _compute_multi_modal_input(self, inter_data: InterDataForSeqGroup,
729729
mm_kwargs, placeholder_maps = MultiModalPlaceholderMap.from_seq_group(
730730
seq_group_metadata,
731731
range(positions[0], positions[0] + len(positions)))
732+
if not mm_kwargs:
733+
return
732734

733735
inter_data.multi_modal_kwargs = mm_kwargs
734736
inter_data.multi_modal_placeholder_maps = placeholder_maps
@@ -739,6 +741,12 @@ def _compute_multi_modal_input(self, inter_data: InterDataForSeqGroup,
739741
video_grid_thw = mm_kwargs.get("video_grid_thw", None)
740742
audio_feature_lengths = mm_kwargs.get("audio_feature_lengths",
741743
None)
744+
assert (
745+
image_grid_thw is not None or video_grid_thw is not None
746+
or audio_feature_lengths is not None), (
747+
"mrope embedding type requires multi-modal input mapper "
748+
"returns 'image_grid_thw' or 'video_grid_thw' or "
749+
"'audio_feature_lengths'.")
742750

743751
second_per_grid_ts = mm_kwargs.get("second_per_grid_ts", None)
744752
use_audio_in_video = mm_kwargs.get("use_audio_in_video", False)

0 commit comments

Comments
 (0)