This commit is contained in:
Yishuo Wang 2024-08-07 09:39:46 +08:00 committed by GitHub
parent e32d13d78c
commit c093f7d980
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -61,7 +61,8 @@ def pre_compute_inv_freq(module: torch.nn.Module):
module.base ** module.base **
(torch.arange(0, module.dim, 2, dtype=torch.int64).float() / module.dim) (torch.arange(0, module.dim, 2, dtype=torch.int64).float() / module.dim)
) )
else: elif module.__class__.__name__ in ["Phi3SuScaledRotaryEmbedding",
"Phi3LongRoPEScaledRotaryEmbedding"]:
inv_freq_shape = torch.arange(0, module.dim, 2, dtype=torch.int64).float() / module.dim inv_freq_shape = torch.arange(0, module.dim, 2, dtype=torch.int64).float() / module.dim
short_ext_factors = torch.tensor(module.short_factor, dtype=torch.float32) short_ext_factors = torch.tensor(module.short_factor, dtype=torch.float32)
module.inv_freq = 1.0 / (short_ext_factors * module.base ** inv_freq_shape) module.inv_freq = 1.0 / (short_ext_factors * module.base ** inv_freq_shape)