diff --git a/src/transformers/models/llava_next_video/modeling_llava_next_video.py b/src/transformers/models/llava_next_video/modeling_llava_next_video.py index b73b2f6994d9a8..46b9b23bd66b04 100644 --- a/src/transformers/models/llava_next_video/modeling_llava_next_video.py +++ b/src/transformers/models/llava_next_video/modeling_llava_next_video.py @@ -908,6 +908,7 @@ def forward( image_features, feature_lens = self.pack_image_features( image_features, image_sizes, + self.vision_feature_select_strategy, image_newline=self.image_newline, ) diff --git a/src/transformers/models/llava_next_video/modular_llava_next_video.py b/src/transformers/models/llava_next_video/modular_llava_next_video.py index f0ec4578e4883d..f48056cfb97e22 100644 --- a/src/transformers/models/llava_next_video/modular_llava_next_video.py +++ b/src/transformers/models/llava_next_video/modular_llava_next_video.py @@ -413,6 +413,7 @@ def forward( image_features, feature_lens = self.pack_image_features( image_features, image_sizes, + self.vision_feature_select_strategy, image_newline=self.image_newline, )