LLM: add enable_xetla parameter for optimize_model API (#10753)
This commit is contained in:
parent
3590e1be83
commit
3d561b60ac
1 changed file with 2 additions and 1 deletion
|
|
@@ -253,7 +253,8 @@ def optimize_model(model, low_bit='sym_int4', optimize_llm=True, modules_to_not_
|
||||||
optimize_model=optimize_llm,
|
optimize_model=optimize_llm,
|
||||||
modules_to_not_convert=modules_to_not_convert,
|
modules_to_not_convert=modules_to_not_convert,
|
||||||
cpu_embedding=cpu_embedding,
|
cpu_embedding=cpu_embedding,
|
||||||
lightweight_bmm=lightweight_bmm)
|
lightweight_bmm=lightweight_bmm,
|
||||||
|
enable_xetla=kwargs.pop("enable_xetla", False))
|
||||||
# add save_low_bit to pretrained model dynamically
|
# add save_low_bit to pretrained model dynamically
|
||||||
import types
|
import types
|
||||||
model._bigdl_config = dict()
|
model._bigdl_config = dict()
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue