This commit is contained in:
Yishuo Wang 2024-08-21 10:31:41 +08:00 committed by GitHub
parent eab6f6dde4
commit bd1e490d62
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -277,7 +277,7 @@ def phi3_model_forward_wrapper(origin_model_forward):
head_dim = self.config.hidden_size // self.config.num_attention_heads head_dim = self.config.hidden_size // self.config.num_attention_heads
past_key_values = DynamicNormalCache.from_reserved( past_key_values = DynamicNormalCache.from_reserved(
n_layer, inputs.size(0), n_head, inputs.size(1), head_dim, n_layer, inputs.size(0), n_head, inputs.size(1), head_dim,
inputs.dtype, inputs.device self.dtype, inputs.device
) )
return origin_model_forward( return origin_model_forward(
self=self, self=self,