diff --git a/python/llm/src/ipex_llm/transformers/npu_model.py b/python/llm/src/ipex_llm/transformers/npu_model.py index 07faed4f..c37aca8b 100644 --- a/python/llm/src/ipex_llm/transformers/npu_model.py +++ b/python/llm/src/ipex_llm/transformers/npu_model.py @@ -549,7 +549,7 @@ class _BaseAutoModelClass: from ipex_llm.transformers.npu_models.convert_mp import optimize_llm optimize_llm( llm, - max_output_len=max_context_len, + max_context_len=max_context_len, max_prompt_len=max_prompt_len, inter_pp=inter_pp, intra_pp=intra_pp,