LLM: add enable_xetla parameter for optimize_model API (#10753)
				
					
				
			This commit is contained in:
		
							parent
							
								
									3590e1be83
								
							
						
					
					
						commit
						3d561b60ac
					
				
					 1 changed file with 2 additions and 1 deletion
				
			
		| 
						 | 
				
			
			@ -253,7 +253,8 @@ def optimize_model(model, low_bit='sym_int4', optimize_llm=True, modules_to_not_
 | 
			
		|||
                                 optimize_model=optimize_llm,
 | 
			
		||||
                                 modules_to_not_convert=modules_to_not_convert,
 | 
			
		||||
                                 cpu_embedding=cpu_embedding,
 | 
			
		||||
                                 lightweight_bmm=lightweight_bmm)
 | 
			
		||||
                                 lightweight_bmm=lightweight_bmm,
 | 
			
		||||
                                 enable_xetla=kwargs.pop("enable_xetla", False))
 | 
			
		||||
    # add save_low_bit to pretrained model dynamically
 | 
			
		||||
    import types
 | 
			
		||||
    model._bigdl_config = dict()
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
		Loading…
	
		Reference in a new issue