From 59ae9d9739d62fc45d2a43fb9fb3e9b2a2c4fb24 Mon Sep 17 00:00:00 2001 From: kcz358 Date: Tue, 31 Dec 2024 09:57:39 +0000 Subject: [PATCH] Support navit processor --- lmms_eval/models/kino.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/lmms_eval/models/kino.py b/lmms_eval/models/kino.py index ae7793e5..3fb60100 100644 --- a/lmms_eval/models/kino.py +++ b/lmms_eval/models/kino.py @@ -89,7 +89,10 @@ def get_w(weights, keyword): eval_logger.info(f"Loaded audio_modal_projector weights from {pretrained_mlp_projector}. Incompatible keys: {incompatible_keys}") self.pretrained = pretrained - self._processor = KinoProcessor.from_pretrained("Evo-LMM/kino-7b-init", revision=revision, trust_remote_code=trust_remote_code) + if self.model.config.vision_aspect_ratio == "navit": + self._processor = KinoProcessor.from_pretrained("Evo-LMM/kino-maas-7B_v12_18000_init", revision=revision, trust_remote_code=trust_remote_code) + else: + self._processor = KinoProcessor.from_pretrained("Evo-LMM/kino-7b-init", revision=revision, trust_remote_code=trust_remote_code) # Pad from left for batched generation: https://huggingface.co/docs/transformers/v4.39.3/en/model_doc/llava#usage-tips self._processor.tokenizer.padding_side = "left" self._tokenizer = self._processor.tokenizer