rename BIGDL_OPTIMIZE_LM_HEAD to IPEX_LLM_LAST_LM_HEAD and add qwen2 (#11418)

2024-06-24 18:42:37 +08:00 · 2024-06-24 18:42:37 +08:00 · 9e4ee61737
commit 9e4ee61737
parent 75f836f288
1 changed file with 2 additions and 2 deletions
--- a/python/llm/src/ipex_llm/transformers/convert.py
+++ b/python/llm/src/ipex_llm/transformers/convert.py
@@ -328,8 +328,8 @@ def _replace_with_low_bit_linear(model, qtype, modules_to_not_convert=None,
            optimize_lm_head = False
            if is_lm_head(name, model_config, out_features):
                model_type = getattr(model_config, "model_type", None)
-                if model_type in ["gptj", "llama"] and os.environ.get("BIGDL_OPTIMIZE_LM_HEAD",
-                                                                      None) == "1":
+                if model_type in ["gptj", "llama", "qwen2"] and \
+                        os.environ.get("IPEX_LLM_LAST_LM_HEAD", None) == "1":
                    optimize_lm_head = True
            with init_empty_weights():
                new_linear = None