From bd1e490d62a1b174575ed6da4a6de768c8c07e37 Mon Sep 17 00:00:00 2001 From: Yishuo Wang Date: Wed, 21 Aug 2024 10:31:41 +0800 Subject: [PATCH] fix phi3 (#11878) --- python/llm/src/ipex_llm/transformers/models/phi3.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/llm/src/ipex_llm/transformers/models/phi3.py b/python/llm/src/ipex_llm/transformers/models/phi3.py index bfa380c2..0b7f873e 100644 --- a/python/llm/src/ipex_llm/transformers/models/phi3.py +++ b/python/llm/src/ipex_llm/transformers/models/phi3.py @@ -277,7 +277,7 @@ def phi3_model_forward_wrapper(origin_model_forward): head_dim = self.config.hidden_size // self.config.num_attention_heads past_key_values = DynamicNormalCache.from_reserved( n_layer, inputs.size(0), n_head, inputs.size(1), head_dim, - inputs.dtype, inputs.device + self.dtype, inputs.device ) return origin_model_forward( self=self,