diff --git a/python/llm/src/ipex_llm/transformers/npu_models/qwen2_mp.py b/python/llm/src/ipex_llm/transformers/npu_models/qwen2_mp.py index c6cb74c8..e1c6f9b8 100644 --- a/python/llm/src/ipex_llm/transformers/npu_models/qwen2_mp.py +++ b/python/llm/src/ipex_llm/transformers/npu_models/qwen2_mp.py @@ -587,6 +587,7 @@ def run_decode( (attn_layer.v_proj.weight, attn_layer.v_proj.scale), (attn_layer.o_proj.weight, attn_layer.o_proj.scale), (mlp_layer.gate_proj.weight, mlp_layer.gate_proj.scale), + (mlp_layer.up_proj.weight, mlp_layer.up_proj.scale), (mlp_layer.down_proj_0.weight, mlp_layer.down_proj_0.scale), (mlp_layer.down_proj_1.weight, mlp_layer.down_proj_1.scale) ]