From 0b57892e0e4dca0a2fb35da2a6e9944e164f12ce Mon Sep 17 00:00:00 2001 From: leonardozcm Date: Fri, 16 Aug 2024 15:48:16 +0800 Subject: [PATCH] fix load low bit com dtype --- python/llm/src/ipex_llm/transformers/convert.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/llm/src/ipex_llm/transformers/convert.py b/python/llm/src/ipex_llm/transformers/convert.py index 2ce495f0232..82ad27eb853 100644 --- a/python/llm/src/ipex_llm/transformers/convert.py +++ b/python/llm/src/ipex_llm/transformers/convert.py @@ -1845,7 +1845,7 @@ def safe_bmm_fwd(*args, **kwargs): from ipex_llm.transformers.models.minicpmv import minicpmv_get_vision_embedding convert_forward(model.vpm, vpm_module.Attention, vision_transformer_attention_forward) model.get_vision_embedding = MethodType(minicpmv_get_vision_embedding, model) - elif model.vpm.config.model_type == "siglip": + elif "siglip" in model.vpm.config.model_type: # MiniCPM-V 2.6 from ipex_llm.transformers.models.minicpmv import siglip_attention_forward convert_forward(model.vpm, vpm_module.SiglipAttention, siglip_attention_forward)