diff --git a/python/llm/src/ipex_llm/transformers/npu_models/minicpmv_mp.py b/python/llm/src/ipex_llm/transformers/npu_models/minicpmv_mp.py index 9817ef4a181..8d60eded3ef 100644 --- a/python/llm/src/ipex_llm/transformers/npu_models/minicpmv_mp.py +++ b/python/llm/src/ipex_llm/transformers/npu_models/minicpmv_mp.py @@ -198,7 +198,7 @@ def forward(self, x): @module_optimization def replace_with_Layernorm(layer, qtype=None, device='NPU', - modules_to_not_convert=[], group_size=0): + modules_to_not_convert=[], group_size=0, imatrix=None): if isinstance(layer, torch.nn.LayerNorm): return MinicpmVLayerNorm( weight=layer.weight.to(torch.float16),