Fix internvl fp16 error (#13205)
This commit is contained in:

parent 45864790f7
commit 5a1c1297e1

1 changed file with 5 additions and 1 deletion
@@ -133,7 +133,11 @@ def get_load_function(low_bit):
                    modules = ["vision_encoder", "embed_tokens_extend"]
                if low_bit == "fp16":
                    # to fix qwen2.5-vl and glm-4v
                    if modules is None:
                        modules = ["vision", "visual"]
                    else:
                        modules.append("vision")
                        modules.append("visual")
                optimize_model(self.model,
                               low_bit=low_bit,
                               torch_dtype=self.vllm_config.model_config.dtype,
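For context, here is a minimal, self-contained sketch of the module-list logic this hunk introduces. It assumes, based only on the diff above, that "modules" names the submodules to be kept out of low-bit conversion (the in-code comment cites qwen2.5-vl and glm-4v as models whose vision towers misbehave in fp16); build_skip_modules is a hypothetical helper for illustration, not a function from this file.

def build_skip_modules(low_bit, modules=None):
    """Return the submodule names that should keep full precision."""
    if low_bit == "fp16":
        # Hypothetical restatement of the hunk: ensure the vision
        # towers ("vision", "visual") are on the skip list for fp16,
        # whether or not a skip list was already provided.
        if modules is None:
            modules = ["vision", "visual"]
        else:
            modules.append("vision")
            modules.append("visual")
    return modules

# The branch taken depends on whether a skip list already exists:
assert build_skip_modules("fp16") == ["vision", "visual"]
assert build_skip_modules(
    "fp16", ["vision_encoder", "embed_tokens_extend"]
) == ["vision_encoder", "embed_tokens_extend", "vision", "visual"]
assert build_skip_modules("sym_int4") is None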