[NPU] Hot fix of load_low_bit (#12344)

This commit is contained in:
binbin Deng 2024-11-06 10:07:00 +08:00 committed by GitHub
parent 899a30331a
commit 69e3a56943
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -549,7 +549,7 @@ class _BaseAutoModelClass:
from ipex_llm.transformers.npu_models.convert_mp import optimize_llm
optimize_llm(
llm,
-max_output_len=max_context_len,
+max_context_len=max_context_len,
max_prompt_len=max_prompt_len,
inter_pp=inter_pp,
intra_pp=intra_pp,