Add half precision for fastchat models (#11130)

This commit is contained in:
Guancheng Fu 2024-05-24 15:41:14 +08:00 committed by GitHub
parent 65f4212f89
commit 7f772c5a4f
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -91,6 +91,8 @@ def load_model(
     if device == "xpu":
         import intel_extension_for_pytorch as ipex
+        print("Convert model to half precision...")
+        model = model.half()
         model = model.to('xpu')
     return model, tokenizer