hotfix qwen2-7b weight setting (#11991)

2024-09-02 18:11:08 +08:00 · 2024-09-02 18:11:08 +08:00 · 2f3d1bd0ec
commit 2f3d1bd0ec
parent a40ea7038d
1 changed files with 1 additions and 0 deletions
--- a/python/llm/src/ipex_llm/transformers/npu_models/qwen2_mp.py
+++ b/python/llm/src/ipex_llm/transformers/npu_models/qwen2_mp.py
@@ -587,6 +587,7 @@ def run_decode(
                (attn_layer.v_proj.weight, attn_layer.v_proj.scale),
                (attn_layer.o_proj.weight, attn_layer.o_proj.scale),
                (mlp_layer.gate_proj.weight, mlp_layer.gate_proj.scale),
                (mlp_layer.up_proj.weight, mlp_layer.up_proj.scale),
                (mlp_layer.down_proj_0.weight, mlp_layer.down_proj_0.scale),
                (mlp_layer.down_proj_1.weight, mlp_layer.down_proj_1.scale)
            ]