diff --git a/python/llm/src/ipex_llm/transformers/npu_models/mp_models_base.py b/python/llm/src/ipex_llm/transformers/npu_models/mp_models_base.py index a1dac609243..b25a3dae0fe 100644 --- a/python/llm/src/ipex_llm/transformers/npu_models/mp_models_base.py +++ b/python/llm/src/ipex_llm/transformers/npu_models/mp_models_base.py @@ -470,7 +470,7 @@ def layer_norm(self, hidden_states, layernorm_weight): ) eps = self.constant(self.rms_norm_eps) hidden_states = self.eltwise_div(hidden_states, self.sqrt(self.eltwise_add(variance, eps))) - layernorm_weight = self.convert_to_fp32(layernorm_weight) + hidden_states = self.convert_to_fp16(hidden_states) hidden_states = self.eltwise_mul(layernorm_weight, hidden_states) hidden_states = self.convert_to_fp16(hidden_states) return hidden_states