From 59ae9d9739d62fc45d2a43fb9fb3e9b2a2c4fb24 Mon Sep 17 00:00:00 2001
From: kcz358 <kaichenzhang358@outlook.com>
Date: Tue, 31 Dec 2024 09:57:39 +0000
Subject: [PATCH] kino: load navit processor when vision_aspect_ratio is "navit"

---
 lmms_eval/models/kino.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/lmms_eval/models/kino.py b/lmms_eval/models/kino.py
index ae7793e55..3fb601001 100644
--- a/lmms_eval/models/kino.py
+++ b/lmms_eval/models/kino.py
@@ -89,7 +89,10 @@ def get_w(weights, keyword):
             eval_logger.info(f"Loaded audio_modal_projector weights from {pretrained_mlp_projector}. Incompatible keys: {incompatible_keys}")
 
         self.pretrained = pretrained
-        self._processor = KinoProcessor.from_pretrained("Evo-LMM/kino-7b-init", revision=revision, trust_remote_code=trust_remote_code)
+        if self.model.config.vision_aspect_ratio == "navit":
+            self._processor = KinoProcessor.from_pretrained("Evo-LMM/kino-maas-7B_v12_18000_init", revision=revision, trust_remote_code=trust_remote_code)
+        else:
+            self._processor = KinoProcessor.from_pretrained("Evo-LMM/kino-7b-init", revision=revision, trust_remote_code=trust_remote_code)
         # Pad from left for batched generation: https://huggingface.co/docs/transformers/v4.39.3/en/model_doc/llava#usage-tips
         self._processor.tokenizer.padding_side = "left"
         self._tokenizer = self._processor.tokenizer