diff --git a/python/llm/src/ipex_llm/transformers/loader.py b/python/llm/src/ipex_llm/transformers/loader.py index acaddb7a..7eaf679c 100644 --- a/python/llm/src/ipex_llm/transformers/loader.py +++ b/python/llm/src/ipex_llm/transformers/loader.py @@ -91,6 +91,8 @@ def load_model( if device == "xpu": import intel_extension_for_pytorch as ipex + print("Convert model to half precision...") + model = model.half() model = model.to('xpu') return model, tokenizer