diff --git a/python/llm/src/ipex_llm/transformers/npu_model.py b/python/llm/src/ipex_llm/transformers/npu_model.py index 15605d07..9dbbd1b8 100644 --- a/python/llm/src/ipex_llm/transformers/npu_model.py +++ b/python/llm/src/ipex_llm/transformers/npu_model.py @@ -429,11 +429,10 @@ class _BaseAutoModelClass: os.path.join(pretrained_model_name_or_path, "config.json"), trust_remote_code=trust_remote_code) with torch.device('meta'): - model = transformers.AutoModelForCausalLM.from_config( + model = cls.HF_Model.from_config( config, trust_remote_code=trust_remote_code) try: model_ptr = load_model_from_file(pretrained_model_name_or_path) - model.config = config model.model_ptr = model_ptr model.save_directory = pretrained_model_name_or_path model.kv_len = config_dict['kv_len']