LLM: add enable_xetla parameter for optimize_model API (#10753)
This commit is contained in:
parent
3590e1be83
commit
3d561b60ac
1 changed file with 2 additions and 1 deletion
|
|
@@ -253,7 +253,8 @@ def optimize_model(model, low_bit='sym_int4', optimize_llm=True, modules_to_not_
|
|||
optimize_model=optimize_llm,
|
||||
modules_to_not_convert=modules_to_not_convert,
|
||||
cpu_embedding=cpu_embedding,
|
||||
- lightweight_bmm=lightweight_bmm)
|
||||
+ lightweight_bmm=lightweight_bmm,
|
||||
+ enable_xetla=kwargs.pop("enable_xetla", False))
|
||||
# add save_low_bit to pretrained model dynamically
|
||||
import types
|
||||
model._bigdl_config = dict()
|
||||
|
|
|
|||
Loading…
Reference in a new issue