fix load low bit com dtype (#11832)
This commit is contained in:
parent
cfc959defa
commit
6841a9ac8f
1 changed file with 1 addition and 1 deletion
|
|
@@ -1845,7 +1845,7 @@ def _optimize_post(model, lightweight_bmm=False):
|
||||||
from ipex_llm.transformers.models.minicpmv import minicpmv_get_vision_embedding
|
from ipex_llm.transformers.models.minicpmv import minicpmv_get_vision_embedding
|
||||||
convert_forward(model.vpm, vpm_module.Attention, vision_transformer_attention_forward)
|
convert_forward(model.vpm, vpm_module.Attention, vision_transformer_attention_forward)
|
||||||
model.get_vision_embedding = MethodType(minicpmv_get_vision_embedding, model)
|
model.get_vision_embedding = MethodType(minicpmv_get_vision_embedding, model)
|
||||||
elif model.vpm.config.model_type == "siglip":
|
elif "siglip" in model.vpm.config.model_type:
|
||||||
# MiniCPM-V 2.6
|
# MiniCPM-V 2.6
|
||||||
from ipex_llm.transformers.models.minicpmv import siglip_attention_forward
|
from ipex_llm.transformers.models.minicpmv import siglip_attention_forward
|
||||||
convert_forward(model.vpm, vpm_module.SiglipAttention, siglip_attention_forward)
|
convert_forward(model.vpm, vpm_module.SiglipAttention, siglip_attention_forward)
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue