From 95f41a5eb1faa56aa3347dbe429ec6700a0101c9 Mon Sep 17 00:00:00 2001 From: Yishuo Wang Date: Tue, 24 Dec 2024 17:22:14 +0800 Subject: [PATCH] fix --- python/llm/src/ipex_llm/transformers/convert.py | 1 + 1 file changed, 1 insertion(+) diff --git a/python/llm/src/ipex_llm/transformers/convert.py b/python/llm/src/ipex_llm/transformers/convert.py index 97184b29d66..9877fed0dad 100644 --- a/python/llm/src/ipex_llm/transformers/convert.py +++ b/python/llm/src/ipex_llm/transformers/convert.py @@ -1912,6 +1912,7 @@ def _optimize_post(model, lightweight_bmm=False): convert_forward(model, module.MistralModel, mistral_model_forward) convert_forward(model, module.MistralAttention, mistral_attention_forward) + convert_forward(model, module.MistralSdpaAttention, mistral_attention_forward) convert_forward(model, module.MistralRMSNorm, rms_norm_forward) convert_forward(model, module.MistralMLP, mlp_silu_forward) elif model.config.model_type == "gemma":