fix load low bit com dtype (#11832)
This commit is contained in:
		
							parent
							
								
									cfc959defa
								
							
						
					
					
						commit
						6841a9ac8f
					
				
					 1 changed files with 1 additions and 1 deletions
				
			
		| 
						 | 
					@ -1845,7 +1845,7 @@ def _optimize_post(model, lightweight_bmm=False):
 | 
				
			||||||
            from ipex_llm.transformers.models.minicpmv import minicpmv_get_vision_embedding
 | 
					            from ipex_llm.transformers.models.minicpmv import minicpmv_get_vision_embedding
 | 
				
			||||||
            convert_forward(model.vpm, vpm_module.Attention, vision_transformer_attention_forward)
 | 
					            convert_forward(model.vpm, vpm_module.Attention, vision_transformer_attention_forward)
 | 
				
			||||||
            model.get_vision_embedding = MethodType(minicpmv_get_vision_embedding, model)
 | 
					            model.get_vision_embedding = MethodType(minicpmv_get_vision_embedding, model)
 | 
				
			||||||
        elif model.vpm.config.model_type == "siglip":
 | 
					        elif "siglip" in model.vpm.config.model_type:
 | 
				
			||||||
            # MiniCPM-V 2.6
 | 
					            # MiniCPM-V 2.6
 | 
				
			||||||
            from ipex_llm.transformers.models.minicpmv import siglip_attention_forward
 | 
					            from ipex_llm.transformers.models.minicpmv import siglip_attention_forward
 | 
				
			||||||
            convert_forward(model.vpm, vpm_module.SiglipAttention, siglip_attention_forward)
 | 
					            convert_forward(model.vpm, vpm_module.SiglipAttention, siglip_attention_forward)
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in a new issue